Upload folder using huggingface_hub
Browse files. This view is limited to 50 files because it contains too many changes. See raw diff
- .DS_Store +0 -0
- .gitattributes +1 -0
- config.json +4 -0
- merges.txt +0 -0
- meta.yaml +24 -0
- phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/analytics/coremldata.bin +3 -0
- phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/coremldata.bin +3 -0
- phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/metadata.json +299 -0
- phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/model.mil +0 -0
- phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/weights/weight.bin +3 -0
- phi4_FFN_PF_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- phi4_FFN_PF_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- phi4_FFN_PF_lut4_chunk_01of02.mlpackage/Manifest.json +18 -0
- phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/analytics/coremldata.bin +3 -0
- phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/coremldata.bin +3 -0
- phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/metadata.json +299 -0
- phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/model.mil +0 -0
- phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/weights/weight.bin +3 -0
- phi4_FFN_PF_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- phi4_FFN_PF_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- phi4_FFN_PF_lut4_chunk_02of02.mlpackage/Manifest.json +18 -0
- phi4_FFN_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- phi4_FFN_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- phi4_FFN_lut4_chunk_01of02.mlpackage/Manifest.json +18 -0
- phi4_FFN_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- phi4_FFN_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- phi4_FFN_lut4_chunk_02of02.mlpackage/Manifest.json +18 -0
- phi4_embeddings_lut8.mlmodelc/analytics/coremldata.bin +3 -0
- phi4_embeddings_lut8.mlmodelc/coremldata.bin +3 -0
- phi4_embeddings_lut8.mlmodelc/metadata.json +65 -0
- phi4_embeddings_lut8.mlmodelc/model.mil +21 -0
- phi4_embeddings_lut8.mlmodelc/weights/weight.bin +3 -0
- phi4_embeddings_lut8.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- phi4_embeddings_lut8.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- phi4_embeddings_lut8.mlpackage/Manifest.json +18 -0
- phi4_lm_head_lut6.mlmodelc/analytics/coremldata.bin +3 -0
- phi4_lm_head_lut6.mlmodelc/coremldata.bin +3 -0
- phi4_lm_head_lut6.mlmodelc/metadata.json +63 -0
- phi4_lm_head_lut6.mlmodelc/model.mil +17 -0
- phi4_lm_head_lut6.mlmodelc/weights/weight.bin +3 -0
- phi4_lm_head_lut6.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- phi4_lm_head_lut6.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- phi4_lm_head_lut6.mlpackage/Manifest.json +18 -0
- phi4_prefill_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- phi4_prefill_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- phi4_prefill_lut4_chunk_01of02.mlpackage/Manifest.json +18 -0
- phi4_prefill_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/model.mlmodel +3 -0
- phi4_prefill_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin +3 -0
- phi4_prefill_lut4_chunk_02of02.mlpackage/Manifest.json +18 -0
- tokenizer.json +3 -0
.DS_Store
ADDED
|
Binary file (6.15 kB). View file
|
|
|
.gitattributes
CHANGED
|
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"tokenizer_class": "AutoTokenizer",
|
| 3 |
+
"model_type": "phi3"
|
| 4 |
+
}
|
merges.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
meta.yaml
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
model_info:
|
| 2 |
+
name: anemll-5a149550068a1eb93398160d8953f5f56c3603e9-ctx2048
|
| 3 |
+
version: 0.3.0
|
| 4 |
+
description: |
|
| 5 |
+
Demonstrates running 5a149550068a1eb93398160d8953f5f56c3603e9 on Apple Neural Engine
|
| 6 |
+
Context length: 2048
|
| 7 |
+
Batch size: 64
|
| 8 |
+
Chunks: 2
|
| 9 |
+
license: MIT
|
| 10 |
+
author: Anemll
|
| 11 |
+
framework: Core ML
|
| 12 |
+
language: Python
|
| 13 |
+
parameters:
|
| 14 |
+
context_length: 2048
|
| 15 |
+
batch_size: 64
|
| 16 |
+
lut_embeddings: 8
|
| 17 |
+
lut_ffn: 4
|
| 18 |
+
lut_lmhead: 6
|
| 19 |
+
num_chunks: 2
|
| 20 |
+
model_prefix: phi4
|
| 21 |
+
embeddings: phi4_embeddings_lut8.mlmodelc
|
| 22 |
+
lm_head: phi4_lm_head_lut6.mlmodelc
|
| 23 |
+
ffn: phi4_FFN_PF_lut4.mlmodelc
|
| 24 |
+
split_lm_head: 1
|
phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/analytics/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9100ee1f47c46d82899674cb8dd1267b7b3be5159f56687398744760d68e748a
|
| 3 |
+
size 243
|
phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1dea759822bbf8031a58a2da1da1d9cca24edc09a4ba2c8a1d49917d5cc02716
|
| 3 |
+
size 743
|
phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/metadata.json
ADDED
|
@@ -0,0 +1,299 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"metadataOutputVersion" : "3.0",
|
| 4 |
+
"userDefinedMetadata" : {
|
| 5 |
+
"com.github.apple.coremltools.source_dialect" : "TorchScript",
|
| 6 |
+
"com.github.apple.coremltools.source" : "torch==2.8.0",
|
| 7 |
+
"com.github.apple.coremltools.version" : "9.0b1",
|
| 8 |
+
"com.anemll.info" : "Converted with Anemll v0.3.4"
|
| 9 |
+
},
|
| 10 |
+
"availability" : {
|
| 11 |
+
"macOS" : "15.0",
|
| 12 |
+
"tvOS" : "18.0",
|
| 13 |
+
"visionOS" : "2.0",
|
| 14 |
+
"watchOS" : "11.0",
|
| 15 |
+
"iOS" : "18.0",
|
| 16 |
+
"macCatalyst" : "18.0"
|
| 17 |
+
},
|
| 18 |
+
"inputSchema" : [
|
| 19 |
+
{
|
| 20 |
+
"hasShapeFlexibility" : "0",
|
| 21 |
+
"isOptional" : "0",
|
| 22 |
+
"dataType" : "Float16",
|
| 23 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
|
| 24 |
+
"shortDescription" : "",
|
| 25 |
+
"shape" : "[1, 1, 3072]",
|
| 26 |
+
"name" : "hidden_states",
|
| 27 |
+
"type" : "MultiArray"
|
| 28 |
+
},
|
| 29 |
+
{
|
| 30 |
+
"hasShapeFlexibility" : "0",
|
| 31 |
+
"isOptional" : "0",
|
| 32 |
+
"dataType" : "Int32",
|
| 33 |
+
"formattedType" : "MultiArray (Int32 1)",
|
| 34 |
+
"shortDescription" : "",
|
| 35 |
+
"shape" : "[1]",
|
| 36 |
+
"name" : "position_ids",
|
| 37 |
+
"type" : "MultiArray"
|
| 38 |
+
},
|
| 39 |
+
{
|
| 40 |
+
"hasShapeFlexibility" : "0",
|
| 41 |
+
"isOptional" : "0",
|
| 42 |
+
"dataType" : "Float16",
|
| 43 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 1 × 2048)",
|
| 44 |
+
"shortDescription" : "",
|
| 45 |
+
"shape" : "[1, 1, 1, 2048]",
|
| 46 |
+
"name" : "causal_mask",
|
| 47 |
+
"type" : "MultiArray"
|
| 48 |
+
},
|
| 49 |
+
{
|
| 50 |
+
"hasShapeFlexibility" : "0",
|
| 51 |
+
"isOptional" : "0",
|
| 52 |
+
"dataType" : "Int32",
|
| 53 |
+
"formattedType" : "MultiArray (Int32 1)",
|
| 54 |
+
"shortDescription" : "",
|
| 55 |
+
"shape" : "[1]",
|
| 56 |
+
"name" : "current_pos",
|
| 57 |
+
"type" : "MultiArray"
|
| 58 |
+
}
|
| 59 |
+
],
|
| 60 |
+
"outputSchema" : [
|
| 61 |
+
{
|
| 62 |
+
"hasShapeFlexibility" : "0",
|
| 63 |
+
"isOptional" : "0",
|
| 64 |
+
"dataType" : "Float16",
|
| 65 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
|
| 66 |
+
"shortDescription" : "",
|
| 67 |
+
"shape" : "[1, 1, 3072]",
|
| 68 |
+
"name" : "output_hidden_states",
|
| 69 |
+
"type" : "MultiArray"
|
| 70 |
+
}
|
| 71 |
+
],
|
| 72 |
+
"modelParameters" : [
|
| 73 |
+
|
| 74 |
+
],
|
| 75 |
+
"storagePrecision" : "Mixed (Float16, Int32, Palettized (11 bits), Palettized (13 bits), Palettized (15 bits), Palettized (7 bits), UInt4)",
|
| 76 |
+
"method" : "predict",
|
| 77 |
+
"functions" : [
|
| 78 |
+
{
|
| 79 |
+
"inputSchema" : [
|
| 80 |
+
{
|
| 81 |
+
"hasShapeFlexibility" : "0",
|
| 82 |
+
"isOptional" : "0",
|
| 83 |
+
"dataType" : "Float16",
|
| 84 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
|
| 85 |
+
"shortDescription" : "",
|
| 86 |
+
"shape" : "[1, 1, 3072]",
|
| 87 |
+
"name" : "hidden_states",
|
| 88 |
+
"type" : "MultiArray"
|
| 89 |
+
},
|
| 90 |
+
{
|
| 91 |
+
"hasShapeFlexibility" : "0",
|
| 92 |
+
"isOptional" : "0",
|
| 93 |
+
"dataType" : "Int32",
|
| 94 |
+
"formattedType" : "MultiArray (Int32 1)",
|
| 95 |
+
"shortDescription" : "",
|
| 96 |
+
"shape" : "[1]",
|
| 97 |
+
"name" : "position_ids",
|
| 98 |
+
"type" : "MultiArray"
|
| 99 |
+
},
|
| 100 |
+
{
|
| 101 |
+
"hasShapeFlexibility" : "0",
|
| 102 |
+
"isOptional" : "0",
|
| 103 |
+
"dataType" : "Float16",
|
| 104 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 1 × 2048)",
|
| 105 |
+
"shortDescription" : "",
|
| 106 |
+
"shape" : "[1, 1, 1, 2048]",
|
| 107 |
+
"name" : "causal_mask",
|
| 108 |
+
"type" : "MultiArray"
|
| 109 |
+
},
|
| 110 |
+
{
|
| 111 |
+
"hasShapeFlexibility" : "0",
|
| 112 |
+
"isOptional" : "0",
|
| 113 |
+
"dataType" : "Int32",
|
| 114 |
+
"formattedType" : "MultiArray (Int32 1)",
|
| 115 |
+
"shortDescription" : "",
|
| 116 |
+
"shape" : "[1]",
|
| 117 |
+
"name" : "current_pos",
|
| 118 |
+
"type" : "MultiArray"
|
| 119 |
+
}
|
| 120 |
+
],
|
| 121 |
+
"computePrecision" : "Mixed (Float16, Float32, Int32)",
|
| 122 |
+
"storagePrecision" : "Mixed (Float16, Int32, Palettized (11 bits), Palettized (13 bits), Palettized (15 bits), Palettized (7 bits), UInt4)",
|
| 123 |
+
"stateSchema" : [
|
| 124 |
+
|
| 125 |
+
],
|
| 126 |
+
"outputSchema" : [
|
| 127 |
+
{
|
| 128 |
+
"hasShapeFlexibility" : "0",
|
| 129 |
+
"isOptional" : "0",
|
| 130 |
+
"dataType" : "Float16",
|
| 131 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
|
| 132 |
+
"shortDescription" : "",
|
| 133 |
+
"shape" : "[1, 1, 3072]",
|
| 134 |
+
"name" : "output_hidden_states",
|
| 135 |
+
"type" : "MultiArray"
|
| 136 |
+
}
|
| 137 |
+
],
|
| 138 |
+
"name" : "infer",
|
| 139 |
+
"mlProgramOperationTypeHistogram" : {
|
| 140 |
+
"Ios18.expandDims" : 69,
|
| 141 |
+
"Ios18.mul" : 194,
|
| 142 |
+
"Ios18.cos" : 1,
|
| 143 |
+
"Ios18.softmax" : 16,
|
| 144 |
+
"Ios18.matmul" : 33,
|
| 145 |
+
"Ios18.rsqrt" : 33,
|
| 146 |
+
"Identity" : 2,
|
| 147 |
+
"Ios16.reduceMean" : 33,
|
| 148 |
+
"Ios18.sin" : 1,
|
| 149 |
+
"Split" : 16,
|
| 150 |
+
"Select" : 1,
|
| 151 |
+
"Tile" : 32,
|
| 152 |
+
"Ios18.add" : 113,
|
| 153 |
+
"Ios16.fillLike" : 1,
|
| 154 |
+
"Ios18.sliceUpdate" : 32,
|
| 155 |
+
"Ios18.reshape" : 99,
|
| 156 |
+
"Ios18.constexprLutToDense" : 97,
|
| 157 |
+
"Ios18.conv" : 96,
|
| 158 |
+
"Ios18.concat" : 65,
|
| 159 |
+
"Ios18.cast" : 1,
|
| 160 |
+
"Ios18.transpose" : 18,
|
| 161 |
+
"Ios18.pow" : 33,
|
| 162 |
+
"Ios18.silu" : 16,
|
| 163 |
+
"Ios18.lessEqual" : 1,
|
| 164 |
+
"Ios18.sliceByIndex" : 160,
|
| 165 |
+
"Ios18.squeeze" : 16
|
| 166 |
+
}
|
| 167 |
+
},
|
| 168 |
+
{
|
| 169 |
+
"inputSchema" : [
|
| 170 |
+
{
|
| 171 |
+
"hasShapeFlexibility" : "0",
|
| 172 |
+
"isOptional" : "0",
|
| 173 |
+
"dataType" : "Float16",
|
| 174 |
+
"formattedType" : "MultiArray (Float16 1 × 64 × 3072)",
|
| 175 |
+
"shortDescription" : "",
|
| 176 |
+
"shape" : "[1, 64, 3072]",
|
| 177 |
+
"name" : "hidden_states",
|
| 178 |
+
"type" : "MultiArray"
|
| 179 |
+
},
|
| 180 |
+
{
|
| 181 |
+
"hasShapeFlexibility" : "0",
|
| 182 |
+
"isOptional" : "0",
|
| 183 |
+
"dataType" : "Int32",
|
| 184 |
+
"formattedType" : "MultiArray (Int32 64)",
|
| 185 |
+
"shortDescription" : "",
|
| 186 |
+
"shape" : "[64]",
|
| 187 |
+
"name" : "position_ids",
|
| 188 |
+
"type" : "MultiArray"
|
| 189 |
+
},
|
| 190 |
+
{
|
| 191 |
+
"hasShapeFlexibility" : "0",
|
| 192 |
+
"isOptional" : "0",
|
| 193 |
+
"dataType" : "Float16",
|
| 194 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 64 × 2048)",
|
| 195 |
+
"shortDescription" : "",
|
| 196 |
+
"shape" : "[1, 1, 64, 2048]",
|
| 197 |
+
"name" : "causal_mask",
|
| 198 |
+
"type" : "MultiArray"
|
| 199 |
+
},
|
| 200 |
+
{
|
| 201 |
+
"hasShapeFlexibility" : "0",
|
| 202 |
+
"isOptional" : "0",
|
| 203 |
+
"dataType" : "Int32",
|
| 204 |
+
"formattedType" : "MultiArray (Int32 1)",
|
| 205 |
+
"shortDescription" : "",
|
| 206 |
+
"shape" : "[1]",
|
| 207 |
+
"name" : "current_pos",
|
| 208 |
+
"type" : "MultiArray"
|
| 209 |
+
}
|
| 210 |
+
],
|
| 211 |
+
"computePrecision" : "Mixed (Float16, Float32, Int32)",
|
| 212 |
+
"storagePrecision" : "Mixed (Float16, Palettized (11 bits), Palettized (13 bits), Palettized (15 bits), Palettized (7 bits), UInt4)",
|
| 213 |
+
"stateSchema" : [
|
| 214 |
+
|
| 215 |
+
],
|
| 216 |
+
"outputSchema" : [
|
| 217 |
+
{
|
| 218 |
+
"hasShapeFlexibility" : "0",
|
| 219 |
+
"isOptional" : "0",
|
| 220 |
+
"dataType" : "Float16",
|
| 221 |
+
"formattedType" : "MultiArray (Float16 1 × 64 × 3072)",
|
| 222 |
+
"shortDescription" : "",
|
| 223 |
+
"shape" : "[1, 64, 3072]",
|
| 224 |
+
"name" : "output_hidden_states",
|
| 225 |
+
"type" : "MultiArray"
|
| 226 |
+
}
|
| 227 |
+
],
|
| 228 |
+
"name" : "prefill",
|
| 229 |
+
"mlProgramOperationTypeHistogram" : {
|
| 230 |
+
"Ios18.expandDims" : 67,
|
| 231 |
+
"Ios18.softmax" : 16,
|
| 232 |
+
"Ios18.cos" : 1,
|
| 233 |
+
"Ios18.mul" : 192,
|
| 234 |
+
"Ios18.matmul" : 33,
|
| 235 |
+
"Ios18.rsqrt" : 32,
|
| 236 |
+
"Identity" : 2,
|
| 237 |
+
"Ios16.reduceMean" : 32,
|
| 238 |
+
"Ios18.sin" : 1,
|
| 239 |
+
"Split" : 16,
|
| 240 |
+
"Tile" : 32,
|
| 241 |
+
"Ios18.add" : 112,
|
| 242 |
+
"Ios18.sliceUpdate" : 32,
|
| 243 |
+
"Ios18.reshape" : 98,
|
| 244 |
+
"Ios18.constexprLutToDense" : 97,
|
| 245 |
+
"Ios18.conv" : 96,
|
| 246 |
+
"Ios18.concat" : 65,
|
| 247 |
+
"Ios18.cast" : 1,
|
| 248 |
+
"Ios18.transpose" : 80,
|
| 249 |
+
"Ios18.pow" : 32,
|
| 250 |
+
"Ios18.silu" : 16,
|
| 251 |
+
"Ios18.sliceByIndex" : 160,
|
| 252 |
+
"Ios18.squeeze" : 16
|
| 253 |
+
}
|
| 254 |
+
}
|
| 255 |
+
],
|
| 256 |
+
"version" : "0.3.4",
|
| 257 |
+
"isUpdatable" : "0",
|
| 258 |
+
"defaultFunctionName" : "infer",
|
| 259 |
+
"specificationVersion" : 9,
|
| 260 |
+
"stateSchema" : [
|
| 261 |
+
|
| 262 |
+
],
|
| 263 |
+
"computePrecision" : "Mixed (Float16, Float32, Int32)",
|
| 264 |
+
"mlProgramOperationTypeHistogram" : {
|
| 265 |
+
"Ios18.expandDims" : 69,
|
| 266 |
+
"Ios18.mul" : 194,
|
| 267 |
+
"Ios18.cos" : 1,
|
| 268 |
+
"Ios18.softmax" : 16,
|
| 269 |
+
"Ios18.matmul" : 33,
|
| 270 |
+
"Ios18.rsqrt" : 33,
|
| 271 |
+
"Identity" : 2,
|
| 272 |
+
"Ios16.reduceMean" : 33,
|
| 273 |
+
"Ios18.sin" : 1,
|
| 274 |
+
"Split" : 16,
|
| 275 |
+
"Select" : 1,
|
| 276 |
+
"Tile" : 32,
|
| 277 |
+
"Ios18.add" : 113,
|
| 278 |
+
"Ios16.fillLike" : 1,
|
| 279 |
+
"Ios18.sliceUpdate" : 32,
|
| 280 |
+
"Ios18.reshape" : 99,
|
| 281 |
+
"Ios18.constexprLutToDense" : 97,
|
| 282 |
+
"Ios18.conv" : 96,
|
| 283 |
+
"Ios18.concat" : 65,
|
| 284 |
+
"Ios18.cast" : 1,
|
| 285 |
+
"Ios18.transpose" : 18,
|
| 286 |
+
"Ios18.pow" : 33,
|
| 287 |
+
"Ios18.silu" : 16,
|
| 288 |
+
"Ios18.lessEqual" : 1,
|
| 289 |
+
"Ios18.sliceByIndex" : 160,
|
| 290 |
+
"Ios18.squeeze" : 16
|
| 291 |
+
},
|
| 292 |
+
"shortDescription" : "Anemll Model: Multifunction Combined",
|
| 293 |
+
"generatedClassName" : "phi4_FFN_PF_lut4_chunk_01of02",
|
| 294 |
+
"author" : "Converted with Anemll v0.3.4",
|
| 295 |
+
"modelType" : {
|
| 296 |
+
"name" : "MLModelType_mlProgram"
|
| 297 |
+
}
|
| 298 |
+
}
|
| 299 |
+
]
|
phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/model.mil
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
phi4_FFN_PF_lut4_chunk_01of02.mlmodelc/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c9b1a80fd917817620853cba6084cc50181eb31bebd4b51c03242c3a60714cfa
|
| 3 |
+
size 942252864
|
phi4_FFN_PF_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9ab2caaac8f312247b29b5373e405721bb43fc2afd9981a0d0969c8aeb367071
|
| 3 |
+
size 946777
|
phi4_FFN_PF_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c9b1a80fd917817620853cba6084cc50181eb31bebd4b51c03242c3a60714cfa
|
| 3 |
+
size 942252864
|
phi4_FFN_PF_lut4_chunk_01of02.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"3ED36C90-09E7-454E-993A-613AD9D0DBA7": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Specification",
|
| 7 |
+
"name": "model.mlmodel",
|
| 8 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 9 |
+
},
|
| 10 |
+
"56CB52E7-E373-4A88-A618-FABF77025DEB": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Weights",
|
| 13 |
+
"name": "weights",
|
| 14 |
+
"path": "com.apple.CoreML/weights"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "3ED36C90-09E7-454E-993A-613AD9D0DBA7"
|
| 18 |
+
}
|
phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/analytics/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d459fd207688db500187a3718f7e766ec41fcd451e5e5c621a05d084d401385a
|
| 3 |
+
size 243
|
phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:572b886153dff5be6f240438c1f30e1c5effc7454ae5f9915baa30719bbe7fe7
|
| 3 |
+
size 743
|
phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/metadata.json
ADDED
|
@@ -0,0 +1,299 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"metadataOutputVersion" : "3.0",
|
| 4 |
+
"userDefinedMetadata" : {
|
| 5 |
+
"com.github.apple.coremltools.version" : "9.0b1",
|
| 6 |
+
"com.github.apple.coremltools.source" : "torch==2.8.0",
|
| 7 |
+
"com.anemll.info" : "Converted with Anemll v0.3.4",
|
| 8 |
+
"com.github.apple.coremltools.source_dialect" : "TorchScript"
|
| 9 |
+
},
|
| 10 |
+
"availability" : {
|
| 11 |
+
"macOS" : "15.0",
|
| 12 |
+
"tvOS" : "18.0",
|
| 13 |
+
"visionOS" : "2.0",
|
| 14 |
+
"watchOS" : "11.0",
|
| 15 |
+
"iOS" : "18.0",
|
| 16 |
+
"macCatalyst" : "18.0"
|
| 17 |
+
},
|
| 18 |
+
"inputSchema" : [
|
| 19 |
+
{
|
| 20 |
+
"hasShapeFlexibility" : "0",
|
| 21 |
+
"isOptional" : "0",
|
| 22 |
+
"dataType" : "Float16",
|
| 23 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
|
| 24 |
+
"shortDescription" : "",
|
| 25 |
+
"shape" : "[1, 1, 3072]",
|
| 26 |
+
"name" : "hidden_states",
|
| 27 |
+
"type" : "MultiArray"
|
| 28 |
+
},
|
| 29 |
+
{
|
| 30 |
+
"hasShapeFlexibility" : "0",
|
| 31 |
+
"isOptional" : "0",
|
| 32 |
+
"dataType" : "Int32",
|
| 33 |
+
"formattedType" : "MultiArray (Int32 1)",
|
| 34 |
+
"shortDescription" : "",
|
| 35 |
+
"shape" : "[1]",
|
| 36 |
+
"name" : "position_ids",
|
| 37 |
+
"type" : "MultiArray"
|
| 38 |
+
},
|
| 39 |
+
{
|
| 40 |
+
"hasShapeFlexibility" : "0",
|
| 41 |
+
"isOptional" : "0",
|
| 42 |
+
"dataType" : "Float16",
|
| 43 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 1 × 2048)",
|
| 44 |
+
"shortDescription" : "",
|
| 45 |
+
"shape" : "[1, 1, 1, 2048]",
|
| 46 |
+
"name" : "causal_mask",
|
| 47 |
+
"type" : "MultiArray"
|
| 48 |
+
},
|
| 49 |
+
{
|
| 50 |
+
"hasShapeFlexibility" : "0",
|
| 51 |
+
"isOptional" : "0",
|
| 52 |
+
"dataType" : "Int32",
|
| 53 |
+
"formattedType" : "MultiArray (Int32 1)",
|
| 54 |
+
"shortDescription" : "",
|
| 55 |
+
"shape" : "[1]",
|
| 56 |
+
"name" : "current_pos",
|
| 57 |
+
"type" : "MultiArray"
|
| 58 |
+
}
|
| 59 |
+
],
|
| 60 |
+
"outputSchema" : [
|
| 61 |
+
{
|
| 62 |
+
"hasShapeFlexibility" : "0",
|
| 63 |
+
"isOptional" : "0",
|
| 64 |
+
"dataType" : "Float16",
|
| 65 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
|
| 66 |
+
"shortDescription" : "",
|
| 67 |
+
"shape" : "[1, 1, 3072]",
|
| 68 |
+
"name" : "output_hidden_states",
|
| 69 |
+
"type" : "MultiArray"
|
| 70 |
+
}
|
| 71 |
+
],
|
| 72 |
+
"modelParameters" : [
|
| 73 |
+
|
| 74 |
+
],
|
| 75 |
+
"storagePrecision" : "Mixed (Float16, Int32, Palettized (11 bits), Palettized (13 bits), Palettized (15 bits), Palettized (7 bits), UInt4)",
|
| 76 |
+
"method" : "predict",
|
| 77 |
+
"functions" : [
|
| 78 |
+
{
|
| 79 |
+
"inputSchema" : [
|
| 80 |
+
{
|
| 81 |
+
"hasShapeFlexibility" : "0",
|
| 82 |
+
"isOptional" : "0",
|
| 83 |
+
"dataType" : "Float16",
|
| 84 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
|
| 85 |
+
"shortDescription" : "",
|
| 86 |
+
"shape" : "[1, 1, 3072]",
|
| 87 |
+
"name" : "hidden_states",
|
| 88 |
+
"type" : "MultiArray"
|
| 89 |
+
},
|
| 90 |
+
{
|
| 91 |
+
"hasShapeFlexibility" : "0",
|
| 92 |
+
"isOptional" : "0",
|
| 93 |
+
"dataType" : "Int32",
|
| 94 |
+
"formattedType" : "MultiArray (Int32 1)",
|
| 95 |
+
"shortDescription" : "",
|
| 96 |
+
"shape" : "[1]",
|
| 97 |
+
"name" : "position_ids",
|
| 98 |
+
"type" : "MultiArray"
|
| 99 |
+
},
|
| 100 |
+
{
|
| 101 |
+
"hasShapeFlexibility" : "0",
|
| 102 |
+
"isOptional" : "0",
|
| 103 |
+
"dataType" : "Float16",
|
| 104 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 1 × 2048)",
|
| 105 |
+
"shortDescription" : "",
|
| 106 |
+
"shape" : "[1, 1, 1, 2048]",
|
| 107 |
+
"name" : "causal_mask",
|
| 108 |
+
"type" : "MultiArray"
|
| 109 |
+
},
|
| 110 |
+
{
|
| 111 |
+
"hasShapeFlexibility" : "0",
|
| 112 |
+
"isOptional" : "0",
|
| 113 |
+
"dataType" : "Int32",
|
| 114 |
+
"formattedType" : "MultiArray (Int32 1)",
|
| 115 |
+
"shortDescription" : "",
|
| 116 |
+
"shape" : "[1]",
|
| 117 |
+
"name" : "current_pos",
|
| 118 |
+
"type" : "MultiArray"
|
| 119 |
+
}
|
| 120 |
+
],
|
| 121 |
+
"computePrecision" : "Mixed (Float16, Float32, Int32)",
|
| 122 |
+
"storagePrecision" : "Mixed (Float16, Int32, Palettized (11 bits), Palettized (13 bits), Palettized (15 bits), Palettized (7 bits), UInt4)",
|
| 123 |
+
"stateSchema" : [
|
| 124 |
+
|
| 125 |
+
],
|
| 126 |
+
"outputSchema" : [
|
| 127 |
+
{
|
| 128 |
+
"hasShapeFlexibility" : "0",
|
| 129 |
+
"isOptional" : "0",
|
| 130 |
+
"dataType" : "Float16",
|
| 131 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
|
| 132 |
+
"shortDescription" : "",
|
| 133 |
+
"shape" : "[1, 1, 3072]",
|
| 134 |
+
"name" : "output_hidden_states",
|
| 135 |
+
"type" : "MultiArray"
|
| 136 |
+
}
|
| 137 |
+
],
|
| 138 |
+
"name" : "infer",
|
| 139 |
+
"mlProgramOperationTypeHistogram" : {
|
| 140 |
+
"Ios18.expandDims" : 69,
|
| 141 |
+
"Ios18.mul" : 194,
|
| 142 |
+
"Ios18.cos" : 1,
|
| 143 |
+
"Ios18.softmax" : 16,
|
| 144 |
+
"Ios18.matmul" : 33,
|
| 145 |
+
"Ios18.rsqrt" : 33,
|
| 146 |
+
"Identity" : 2,
|
| 147 |
+
"Ios16.reduceMean" : 33,
|
| 148 |
+
"Ios18.sin" : 1,
|
| 149 |
+
"Split" : 16,
|
| 150 |
+
"Select" : 1,
|
| 151 |
+
"Tile" : 32,
|
| 152 |
+
"Ios18.add" : 113,
|
| 153 |
+
"Ios16.fillLike" : 1,
|
| 154 |
+
"Ios18.sliceUpdate" : 32,
|
| 155 |
+
"Ios18.reshape" : 99,
|
| 156 |
+
"Ios18.constexprLutToDense" : 97,
|
| 157 |
+
"Ios18.conv" : 96,
|
| 158 |
+
"Ios18.concat" : 65,
|
| 159 |
+
"Ios18.cast" : 1,
|
| 160 |
+
"Ios18.transpose" : 18,
|
| 161 |
+
"Ios18.pow" : 33,
|
| 162 |
+
"Ios18.silu" : 16,
|
| 163 |
+
"Ios18.lessEqual" : 1,
|
| 164 |
+
"Ios18.sliceByIndex" : 160,
|
| 165 |
+
"Ios18.squeeze" : 16
|
| 166 |
+
}
|
| 167 |
+
},
|
| 168 |
+
{
|
| 169 |
+
"inputSchema" : [
|
| 170 |
+
{
|
| 171 |
+
"hasShapeFlexibility" : "0",
|
| 172 |
+
"isOptional" : "0",
|
| 173 |
+
"dataType" : "Float16",
|
| 174 |
+
"formattedType" : "MultiArray (Float16 1 × 64 × 3072)",
|
| 175 |
+
"shortDescription" : "",
|
| 176 |
+
"shape" : "[1, 64, 3072]",
|
| 177 |
+
"name" : "hidden_states",
|
| 178 |
+
"type" : "MultiArray"
|
| 179 |
+
},
|
| 180 |
+
{
|
| 181 |
+
"hasShapeFlexibility" : "0",
|
| 182 |
+
"isOptional" : "0",
|
| 183 |
+
"dataType" : "Int32",
|
| 184 |
+
"formattedType" : "MultiArray (Int32 64)",
|
| 185 |
+
"shortDescription" : "",
|
| 186 |
+
"shape" : "[64]",
|
| 187 |
+
"name" : "position_ids",
|
| 188 |
+
"type" : "MultiArray"
|
| 189 |
+
},
|
| 190 |
+
{
|
| 191 |
+
"hasShapeFlexibility" : "0",
|
| 192 |
+
"isOptional" : "0",
|
| 193 |
+
"dataType" : "Float16",
|
| 194 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 64 × 2048)",
|
| 195 |
+
"shortDescription" : "",
|
| 196 |
+
"shape" : "[1, 1, 64, 2048]",
|
| 197 |
+
"name" : "causal_mask",
|
| 198 |
+
"type" : "MultiArray"
|
| 199 |
+
},
|
| 200 |
+
{
|
| 201 |
+
"hasShapeFlexibility" : "0",
|
| 202 |
+
"isOptional" : "0",
|
| 203 |
+
"dataType" : "Int32",
|
| 204 |
+
"formattedType" : "MultiArray (Int32 1)",
|
| 205 |
+
"shortDescription" : "",
|
| 206 |
+
"shape" : "[1]",
|
| 207 |
+
"name" : "current_pos",
|
| 208 |
+
"type" : "MultiArray"
|
| 209 |
+
}
|
| 210 |
+
],
|
| 211 |
+
"computePrecision" : "Mixed (Float16, Float32, Int32)",
|
| 212 |
+
"storagePrecision" : "Mixed (Float16, Palettized (11 bits), Palettized (13 bits), Palettized (15 bits), Palettized (7 bits), UInt4)",
|
| 213 |
+
"stateSchema" : [
|
| 214 |
+
|
| 215 |
+
],
|
| 216 |
+
"outputSchema" : [
|
| 217 |
+
{
|
| 218 |
+
"hasShapeFlexibility" : "0",
|
| 219 |
+
"isOptional" : "0",
|
| 220 |
+
"dataType" : "Float16",
|
| 221 |
+
"formattedType" : "MultiArray (Float16 1 × 64 × 3072)",
|
| 222 |
+
"shortDescription" : "",
|
| 223 |
+
"shape" : "[1, 64, 3072]",
|
| 224 |
+
"name" : "output_hidden_states",
|
| 225 |
+
"type" : "MultiArray"
|
| 226 |
+
}
|
| 227 |
+
],
|
| 228 |
+
"name" : "prefill",
|
| 229 |
+
"mlProgramOperationTypeHistogram" : {
|
| 230 |
+
"Ios18.expandDims" : 67,
|
| 231 |
+
"Ios18.softmax" : 16,
|
| 232 |
+
"Ios18.cos" : 1,
|
| 233 |
+
"Ios18.mul" : 192,
|
| 234 |
+
"Ios18.matmul" : 33,
|
| 235 |
+
"Ios18.rsqrt" : 32,
|
| 236 |
+
"Identity" : 2,
|
| 237 |
+
"Ios16.reduceMean" : 32,
|
| 238 |
+
"Ios18.sin" : 1,
|
| 239 |
+
"Split" : 16,
|
| 240 |
+
"Tile" : 32,
|
| 241 |
+
"Ios18.add" : 112,
|
| 242 |
+
"Ios18.sliceUpdate" : 32,
|
| 243 |
+
"Ios18.reshape" : 98,
|
| 244 |
+
"Ios18.constexprLutToDense" : 97,
|
| 245 |
+
"Ios18.conv" : 96,
|
| 246 |
+
"Ios18.concat" : 65,
|
| 247 |
+
"Ios18.cast" : 1,
|
| 248 |
+
"Ios18.transpose" : 80,
|
| 249 |
+
"Ios18.pow" : 32,
|
| 250 |
+
"Ios18.silu" : 16,
|
| 251 |
+
"Ios18.sliceByIndex" : 160,
|
| 252 |
+
"Ios18.squeeze" : 16
|
| 253 |
+
}
|
| 254 |
+
}
|
| 255 |
+
],
|
| 256 |
+
"version" : "0.3.4",
|
| 257 |
+
"isUpdatable" : "0",
|
| 258 |
+
"defaultFunctionName" : "infer",
|
| 259 |
+
"specificationVersion" : 9,
|
| 260 |
+
"stateSchema" : [
|
| 261 |
+
|
| 262 |
+
],
|
| 263 |
+
"computePrecision" : "Mixed (Float16, Float32, Int32)",
|
| 264 |
+
"mlProgramOperationTypeHistogram" : {
|
| 265 |
+
"Ios18.expandDims" : 69,
|
| 266 |
+
"Ios18.mul" : 194,
|
| 267 |
+
"Ios18.cos" : 1,
|
| 268 |
+
"Ios18.softmax" : 16,
|
| 269 |
+
"Ios18.matmul" : 33,
|
| 270 |
+
"Ios18.rsqrt" : 33,
|
| 271 |
+
"Identity" : 2,
|
| 272 |
+
"Ios16.reduceMean" : 33,
|
| 273 |
+
"Ios18.sin" : 1,
|
| 274 |
+
"Split" : 16,
|
| 275 |
+
"Select" : 1,
|
| 276 |
+
"Tile" : 32,
|
| 277 |
+
"Ios18.add" : 113,
|
| 278 |
+
"Ios16.fillLike" : 1,
|
| 279 |
+
"Ios18.sliceUpdate" : 32,
|
| 280 |
+
"Ios18.reshape" : 99,
|
| 281 |
+
"Ios18.constexprLutToDense" : 97,
|
| 282 |
+
"Ios18.conv" : 96,
|
| 283 |
+
"Ios18.concat" : 65,
|
| 284 |
+
"Ios18.cast" : 1,
|
| 285 |
+
"Ios18.transpose" : 18,
|
| 286 |
+
"Ios18.pow" : 33,
|
| 287 |
+
"Ios18.silu" : 16,
|
| 288 |
+
"Ios18.lessEqual" : 1,
|
| 289 |
+
"Ios18.sliceByIndex" : 160,
|
| 290 |
+
"Ios18.squeeze" : 16
|
| 291 |
+
},
|
| 292 |
+
"shortDescription" : "Anemll Model: Multifunction Combined",
|
| 293 |
+
"generatedClassName" : "phi4_FFN_PF_lut4_chunk_02of02",
|
| 294 |
+
"author" : "Converted with Anemll v0.3.4",
|
| 295 |
+
"modelType" : {
|
| 296 |
+
"name" : "MLModelType_mlProgram"
|
| 297 |
+
}
|
| 298 |
+
}
|
| 299 |
+
]
|
phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/model.mil
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
phi4_FFN_PF_lut4_chunk_02of02.mlmodelc/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7cddf51a23eccf8537aff0f49164d219a60b12dcfabab1a51b297eed9104d0d
|
| 3 |
+
size 942252864
|
phi4_FFN_PF_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0deac5f27f9d44bdea9ad7c01884078b050749a8a146535c70762679ac9f04de
|
| 3 |
+
size 947140
|
phi4_FFN_PF_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7cddf51a23eccf8537aff0f49164d219a60b12dcfabab1a51b297eed9104d0d
|
| 3 |
+
size 942252864
|
phi4_FFN_PF_lut4_chunk_02of02.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"30CD2E36-07C5-46C1-A067-C7AF3DF75B14": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Specification",
|
| 7 |
+
"name": "model.mlmodel",
|
| 8 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 9 |
+
},
|
| 10 |
+
"4B6D69A1-DA28-4E09-B239-28E2E3CAD832": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Weights",
|
| 13 |
+
"name": "weights",
|
| 14 |
+
"path": "com.apple.CoreML/weights"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "30CD2E36-07C5-46C1-A067-C7AF3DF75B14"
|
| 18 |
+
}
|
phi4_FFN_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:586eb631c94781bc7fb29b0dba9f94aed96c38cc9886abc87e283e62fb597837
|
| 3 |
+
size 465885
|
phi4_FFN_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ce2dab2f6ca3968850368574439596cbc90af797aa8b887ad7bf556c3975c27
|
| 3 |
+
size 941536064
|
phi4_FFN_lut4_chunk_01of02.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"10C45FAA-C192-4B04-A068-94CC88D24529": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Specification",
|
| 7 |
+
"name": "model.mlmodel",
|
| 8 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 9 |
+
},
|
| 10 |
+
"CD944379-EDFB-49EF-BF36-AD1F74C8E637": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Weights",
|
| 13 |
+
"name": "weights",
|
| 14 |
+
"path": "com.apple.CoreML/weights"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "10C45FAA-C192-4B04-A068-94CC88D24529"
|
| 18 |
+
}
|
phi4_FFN_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:01da65b3bc03491a84d0f48d5de5ad0355492b8d176244ce4fcf65f5b128ebe4
|
| 3 |
+
size 466038
|
phi4_FFN_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f4b93c86e74522162838912ec96960a71fb56953b9a9cc173fe9d2f02b93938e
|
| 3 |
+
size 941536064
|
phi4_FFN_lut4_chunk_02of02.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"07A9AE1F-BD5F-43F9-9786-BF4AD9AA7067": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Specification",
|
| 7 |
+
"name": "model.mlmodel",
|
| 8 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 9 |
+
},
|
| 10 |
+
"9335DBFF-822F-4875-917B-186684CE3051": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Weights",
|
| 13 |
+
"name": "weights",
|
| 14 |
+
"path": "com.apple.CoreML/weights"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "07A9AE1F-BD5F-43F9-9786-BF4AD9AA7067"
|
| 18 |
+
}
|
phi4_embeddings_lut8.mlmodelc/analytics/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3c9e2c0ee2c9a3a599d109ae298f4474e53fba48d154a57b4a84513f70c6f0a
|
| 3 |
+
size 243
|
phi4_embeddings_lut8.mlmodelc/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc923709421bf358759efcb64df7f19bf8e30bcfbf8aa0dc878c7fa229cf4b6c
|
| 3 |
+
size 383
|
phi4_embeddings_lut8.mlmodelc/metadata.json
ADDED
|
@@ -0,0 +1,65 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"metadataOutputVersion" : "3.0",
|
| 4 |
+
"storagePrecision" : "Mixed (Float16, Palettized (23 bits), UInt8)",
|
| 5 |
+
"outputSchema" : [
|
| 6 |
+
{
|
| 7 |
+
"hasShapeFlexibility" : "0",
|
| 8 |
+
"isOptional" : "0",
|
| 9 |
+
"dataType" : "Float16",
|
| 10 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
|
| 11 |
+
"shortDescription" : "",
|
| 12 |
+
"shape" : "[1, 1, 3072]",
|
| 13 |
+
"name" : "hidden_states",
|
| 14 |
+
"type" : "MultiArray"
|
| 15 |
+
}
|
| 16 |
+
],
|
| 17 |
+
"modelParameters" : [
|
| 18 |
+
|
| 19 |
+
],
|
| 20 |
+
"specificationVersion" : 9,
|
| 21 |
+
"mlProgramOperationTypeHistogram" : {
|
| 22 |
+
"Ios18.greaterEqual" : 2,
|
| 23 |
+
"Ios18.constexprLutToDense" : 1,
|
| 24 |
+
"Ios18.add" : 2,
|
| 25 |
+
"Select" : 2,
|
| 26 |
+
"Ios18.gather" : 1
|
| 27 |
+
},
|
| 28 |
+
"computePrecision" : "Mixed (Float16, Int32)",
|
| 29 |
+
"isUpdatable" : "0",
|
| 30 |
+
"stateSchema" : [
|
| 31 |
+
|
| 32 |
+
],
|
| 33 |
+
"availability" : {
|
| 34 |
+
"macOS" : "15.0",
|
| 35 |
+
"tvOS" : "18.0",
|
| 36 |
+
"visionOS" : "2.0",
|
| 37 |
+
"watchOS" : "11.0",
|
| 38 |
+
"iOS" : "18.0",
|
| 39 |
+
"macCatalyst" : "18.0"
|
| 40 |
+
},
|
| 41 |
+
"modelType" : {
|
| 42 |
+
"name" : "MLModelType_mlProgram"
|
| 43 |
+
},
|
| 44 |
+
"userDefinedMetadata" : {
|
| 45 |
+
"com.github.apple.coremltools.conversion_date" : "2025-09-28",
|
| 46 |
+
"com.github.apple.coremltools.source" : "torch==2.8.0",
|
| 47 |
+
"com.github.apple.coremltools.version" : "9.0b1",
|
| 48 |
+
"com.github.apple.coremltools.source_dialect" : "TorchScript"
|
| 49 |
+
},
|
| 50 |
+
"inputSchema" : [
|
| 51 |
+
{
|
| 52 |
+
"hasShapeFlexibility" : "0",
|
| 53 |
+
"isOptional" : "0",
|
| 54 |
+
"dataType" : "Int32",
|
| 55 |
+
"formattedType" : "MultiArray (Int32 1 × 1)",
|
| 56 |
+
"shortDescription" : "",
|
| 57 |
+
"shape" : "[1, 1]",
|
| 58 |
+
"name" : "input_ids",
|
| 59 |
+
"type" : "MultiArray"
|
| 60 |
+
}
|
| 61 |
+
],
|
| 62 |
+
"generatedClassName" : "phi4_embeddings_lut8",
|
| 63 |
+
"method" : "predict"
|
| 64 |
+
}
|
| 65 |
+
]
|
phi4_embeddings_lut8.mlmodelc/model.mil
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
program(1.3)
|
| 2 |
+
[buildInfo = dict<string, string>({{"coremlc-component-MIL", "3500.14.1"}, {"coremlc-version", "3500.32.1"}})]
|
| 3 |
+
{
|
| 4 |
+
func main<ios18>(tensor<int32, [1, 1]> input_ids) {
|
| 5 |
+
int32 var_6_batch_dims_0 = const()[name = string("op_6_batch_dims_0"), val = int32(0)];
|
| 6 |
+
bool var_6_validate_indices_0 = const()[name = string("op_6_validate_indices_0"), val = bool(false)];
|
| 7 |
+
tensor<fp16, [200064, 3072]> embed_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor<uint8, [200064, 3072]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64))), lut = tensor<fp16, [25008, 1, 256, 1]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(614596736))))[name = string("embed_weight_to_fp16_palettized")];
|
| 8 |
+
int32 greater_equal_0_y_0 = const()[name = string("greater_equal_0_y_0"), val = int32(0)];
|
| 9 |
+
tensor<bool, [1, 1]> greater_equal_0 = greater_equal(x = input_ids, y = greater_equal_0_y_0)[name = string("greater_equal_0")];
|
| 10 |
+
int32 slice_by_index_0 = const()[name = string("slice_by_index_0"), val = int32(200064)];
|
| 11 |
+
tensor<int32, [1, 1]> add_0 = add(x = input_ids, y = slice_by_index_0)[name = string("add_0")];
|
| 12 |
+
tensor<int32, [1, 1]> select_0 = select(a = input_ids, b = add_0, cond = greater_equal_0)[name = string("select_0")];
|
| 13 |
+
int32 greater_equal_0_y_0_1 = const()[name = string("greater_equal_0_y_0_1"), val = int32(0)];
|
| 14 |
+
tensor<bool, [1, 1]> greater_equal_0_1 = greater_equal(x = select_0, y = greater_equal_0_y_0_1)[name = string("greater_equal_0_1")];
|
| 15 |
+
int32 slice_by_index_0_1 = const()[name = string("slice_by_index_0_1"), val = int32(200064)];
|
| 16 |
+
tensor<int32, [1, 1]> add_0_1 = add(x = select_0, y = slice_by_index_0_1)[name = string("add_0_1")];
|
| 17 |
+
tensor<int32, [1, 1]> select_0_1 = select(a = select_0, b = add_0_1, cond = greater_equal_0_1)[name = string("select_0_1")];
|
| 18 |
+
int32 op_6_cast_fp16_axis_0 = const()[name = string("op_6_cast_fp16_axis_0"), val = int32(0)];
|
| 19 |
+
tensor<fp16, [1, 1, 3072]> hidden_states = gather(axis = op_6_cast_fp16_axis_0, batch_dims = var_6_batch_dims_0, indices = select_0_1, validate_indices = var_6_validate_indices_0, x = embed_weight_to_fp16_palettized)[name = string("op_6_cast_fp16")];
|
| 20 |
+
} -> (hidden_states);
|
| 21 |
+
}
|
phi4_embeddings_lut8.mlmodelc/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:471ccac8a8d66e8f8a024ce8b98f037dd31fa3bac450fdb53f1c8e3308ee011a
|
| 3 |
+
size 627400896
|
phi4_embeddings_lut8.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:92af5fae585670c8e37cafbf73971a02bd75b8c102ec6ab9af0aaa723aa672b0
|
| 3 |
+
size 2526
|
phi4_embeddings_lut8.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:471ccac8a8d66e8f8a024ce8b98f037dd31fa3bac450fdb53f1c8e3308ee011a
|
| 3 |
+
size 627400896
|
phi4_embeddings_lut8.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"61B24E7A-D867-4391-A38F-50F28BF7D5FD": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Specification",
|
| 7 |
+
"name": "model.mlmodel",
|
| 8 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 9 |
+
},
|
| 10 |
+
"7BCAECDE-96CA-47ED-ABB9-3F6559A9D4F4": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Weights",
|
| 13 |
+
"name": "weights",
|
| 14 |
+
"path": "com.apple.CoreML/weights"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "61B24E7A-D867-4391-A38F-50F28BF7D5FD"
|
| 18 |
+
}
|
phi4_lm_head_lut6.mlmodelc/analytics/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d17ebd64d18ae52309635d5106ef6270ad518ededa11856b6c50bdc201c68e2
|
| 3 |
+
size 243
|
phi4_lm_head_lut6.mlmodelc/coremldata.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22a2a16ffd4f1e687322b91095caa994c6a27c2b1616dc92ec3f3f5a429895c1
|
| 3 |
+
size 383
|
phi4_lm_head_lut6.mlmodelc/metadata.json
ADDED
|
@@ -0,0 +1,63 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"metadataOutputVersion" : "3.0",
|
| 4 |
+
"storagePrecision" : "Mixed (Float16, Palettized (21 bits), UInt6)",
|
| 5 |
+
"outputSchema" : [
|
| 6 |
+
{
|
| 7 |
+
"hasShapeFlexibility" : "0",
|
| 8 |
+
"isOptional" : "0",
|
| 9 |
+
"dataType" : "Float16",
|
| 10 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 200064)",
|
| 11 |
+
"shortDescription" : "",
|
| 12 |
+
"shape" : "[1, 1, 200064]",
|
| 13 |
+
"name" : "logits",
|
| 14 |
+
"type" : "MultiArray"
|
| 15 |
+
}
|
| 16 |
+
],
|
| 17 |
+
"modelParameters" : [
|
| 18 |
+
|
| 19 |
+
],
|
| 20 |
+
"specificationVersion" : 9,
|
| 21 |
+
"mlProgramOperationTypeHistogram" : {
|
| 22 |
+
"Ios18.constexprLutToDense" : 1,
|
| 23 |
+
"Ios18.transpose" : 2,
|
| 24 |
+
"Ios18.conv" : 1
|
| 25 |
+
},
|
| 26 |
+
"computePrecision" : "Mixed (Float16, Int32)",
|
| 27 |
+
"isUpdatable" : "0",
|
| 28 |
+
"stateSchema" : [
|
| 29 |
+
|
| 30 |
+
],
|
| 31 |
+
"availability" : {
|
| 32 |
+
"macOS" : "15.0",
|
| 33 |
+
"tvOS" : "18.0",
|
| 34 |
+
"visionOS" : "2.0",
|
| 35 |
+
"watchOS" : "11.0",
|
| 36 |
+
"iOS" : "18.0",
|
| 37 |
+
"macCatalyst" : "18.0"
|
| 38 |
+
},
|
| 39 |
+
"modelType" : {
|
| 40 |
+
"name" : "MLModelType_mlProgram"
|
| 41 |
+
},
|
| 42 |
+
"userDefinedMetadata" : {
|
| 43 |
+
"com.github.apple.coremltools.conversion_date" : "2025-09-28",
|
| 44 |
+
"com.github.apple.coremltools.source" : "torch==2.8.0",
|
| 45 |
+
"com.github.apple.coremltools.version" : "9.0b1",
|
| 46 |
+
"com.github.apple.coremltools.source_dialect" : "TorchScript"
|
| 47 |
+
},
|
| 48 |
+
"inputSchema" : [
|
| 49 |
+
{
|
| 50 |
+
"hasShapeFlexibility" : "0",
|
| 51 |
+
"isOptional" : "0",
|
| 52 |
+
"dataType" : "Float16",
|
| 53 |
+
"formattedType" : "MultiArray (Float16 1 × 1 × 3072)",
|
| 54 |
+
"shortDescription" : "",
|
| 55 |
+
"shape" : "[1, 1, 3072]",
|
| 56 |
+
"name" : "hidden_states",
|
| 57 |
+
"type" : "MultiArray"
|
| 58 |
+
}
|
| 59 |
+
],
|
| 60 |
+
"generatedClassName" : "phi4_lm_head_lut6",
|
| 61 |
+
"method" : "predict"
|
| 62 |
+
}
|
| 63 |
+
]
|
phi4_lm_head_lut6.mlmodelc/model.mil
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
program(1.3)
|
| 2 |
+
[buildInfo = dict<string, string>({{"coremlc-component-MIL", "3500.14.1"}, {"coremlc-version", "3500.32.1"}})]
|
| 3 |
+
{
|
| 4 |
+
func main<ios18>(tensor<fp16, [1, 1, 3072]> hidden_states) {
|
| 5 |
+
tensor<int32, [3]> var_6 = const()[name = string("op_6"), val = tensor<int32, [3]>([0, 2, 1])];
|
| 6 |
+
string var_22_pad_type_0 = const()[name = string("op_22_pad_type_0"), val = string("valid")];
|
| 7 |
+
int32 var_22_groups_0 = const()[name = string("op_22_groups_0"), val = int32(1)];
|
| 8 |
+
tensor<int32, [1]> var_22_strides_0 = const()[name = string("op_22_strides_0"), val = tensor<int32, [1]>([1])];
|
| 9 |
+
tensor<int32, [2]> var_22_pad_0 = const()[name = string("op_22_pad_0"), val = tensor<int32, [2]>([0, 0])];
|
| 10 |
+
tensor<int32, [1]> var_22_dilations_0 = const()[name = string("op_22_dilations_0"), val = tensor<int32, [1]>([1])];
|
| 11 |
+
tensor<fp16, [200064, 3072, 1]> squeeze_0_cast_fp16_to_fp32_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor<uint6, [200064, 3072, 1]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64))), lut = tensor<fp16, [25008, 1, 1, 64, 1]>(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(460947584))))[name = string("squeeze_0_cast_fp16_to_fp32_to_fp16_palettized")];
|
| 12 |
+
tensor<fp16, [1, 3072, 1]> var_7_cast_fp16 = transpose(perm = var_6, x = hidden_states)[name = string("transpose_1")];
|
| 13 |
+
tensor<fp16, [1, 200064, 1]> var_22_cast_fp16 = conv(dilations = var_22_dilations_0, groups = var_22_groups_0, pad = var_22_pad_0, pad_type = var_22_pad_type_0, strides = var_22_strides_0, weight = squeeze_0_cast_fp16_to_fp32_to_fp16_palettized, x = var_7_cast_fp16)[name = string("op_22_cast_fp16")];
|
| 14 |
+
tensor<int32, [3]> var_26 = const()[name = string("op_26"), val = tensor<int32, [3]>([0, 2, 1])];
|
| 15 |
+
tensor<fp16, [1, 1, 200064]> logits = transpose(perm = var_26, x = var_22_cast_fp16)[name = string("transpose_0")];
|
| 16 |
+
} -> (logits);
|
| 17 |
+
}
|
phi4_lm_head_lut6.mlmodelc/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1620b615ef8cd96a1087ca6fba635eebcc22398c4174ad45ef18dde785d365a
|
| 3 |
+
size 464148672
|
phi4_lm_head_lut6.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e7803878a76f9ada016ee6d8016448971188293a7ae6694eedc1d4ef86fb583
|
| 3 |
+
size 2080
|
phi4_lm_head_lut6.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1620b615ef8cd96a1087ca6fba635eebcc22398c4174ad45ef18dde785d365a
|
| 3 |
+
size 464148672
|
phi4_lm_head_lut6.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"3528B6F8-359A-47AB-9099-3E9C4121A65A": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Weights",
|
| 7 |
+
"name": "weights",
|
| 8 |
+
"path": "com.apple.CoreML/weights"
|
| 9 |
+
},
|
| 10 |
+
"5C3068C5-09B3-469D-9E30-D89DCD3242BA": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Specification",
|
| 13 |
+
"name": "model.mlmodel",
|
| 14 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "5C3068C5-09B3-469D-9E30-D89DCD3242BA"
|
| 18 |
+
}
|
phi4_prefill_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c7dffe2693f54d774fd943549a8029ebf7997991bb633be036c3761b5e97f3f
|
| 3 |
+
size 481032
|
phi4_prefill_lut4_chunk_01of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea0e5d1ec01f7d0a8c55c98384c211456ab42d35799ed274e3787bb86cf1d1b8
|
| 3 |
+
size 942029504
|
phi4_prefill_lut4_chunk_01of02.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"CF8A09C1-D506-45BD-80A3-4E36C2529334": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Weights",
|
| 7 |
+
"name": "weights",
|
| 8 |
+
"path": "com.apple.CoreML/weights"
|
| 9 |
+
},
|
| 10 |
+
"DA5F8CFD-5833-43DD-A9BD-0981D832D125": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Specification",
|
| 13 |
+
"name": "model.mlmodel",
|
| 14 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "DA5F8CFD-5833-43DD-A9BD-0981D832D125"
|
| 18 |
+
}
|
phi4_prefill_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/model.mlmodel
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e0b8e9e132180bed768bc88e6aaa4a2056a0a6506815caf8d1090b1e6becd1f
|
| 3 |
+
size 481242
|
phi4_prefill_lut4_chunk_02of02.mlpackage/Data/com.apple.CoreML/weights/weight.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7344a9ff4bcc5c1e124c7e110973d957cd6ddeafc603e9701b684076678969d4
|
| 3 |
+
size 942029504
|
phi4_prefill_lut4_chunk_02of02.mlpackage/Manifest.json
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"fileFormatVersion": "1.0.0",
|
| 3 |
+
"itemInfoEntries": {
|
| 4 |
+
"05D6FC91-3A2E-4B17-975D-AF311B32C225": {
|
| 5 |
+
"author": "com.apple.CoreML",
|
| 6 |
+
"description": "CoreML Model Specification",
|
| 7 |
+
"name": "model.mlmodel",
|
| 8 |
+
"path": "com.apple.CoreML/model.mlmodel"
|
| 9 |
+
},
|
| 10 |
+
"A203C972-22D7-4829-B187-257027B2E637": {
|
| 11 |
+
"author": "com.apple.CoreML",
|
| 12 |
+
"description": "CoreML Model Weights",
|
| 13 |
+
"name": "weights",
|
| 14 |
+
"path": "com.apple.CoreML/weights"
|
| 15 |
+
}
|
| 16 |
+
},
|
| 17 |
+
"rootModelIdentifier": "05D6FC91-3A2E-4B17-975D-AF311B32C225"
|
| 18 |
+
}
|
tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:382cc235b56c725945e149cc25f191da667c836655efd0857b004320e90e91ea
|
| 3 |
+
size 15524095
|