| [ | |
| { | |
| "metadataOutputVersion" : "3.0", | |
| "storagePrecision" : "Float16", | |
| "outputSchema" : [ | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 1 × 1920)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 1, 1920]", | |
| "name" : "var_1445", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 512 × 16)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 512, 16]", | |
| "name" : "y_end_1", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 2 × 1 × 8 × 256 × 64)", | |
| "shortDescription" : "", | |
| "shape" : "[2, 1, 8, 256, 64]", | |
| "name" : "new_cache_1_internal_tensor_assign_2", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "var_402", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "new_end_offset_1", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 2 × 1 × 8 × 256 × 64)", | |
| "shortDescription" : "", | |
| "shape" : "[2, 1, 8, 256, 64]", | |
| "name" : "new_cache_internal_tensor_assign_2", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "var_825", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "new_end_offset", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 512 × 6)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 512, 6]", | |
| "name" : "var_998", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "var_1006", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 256 × 6)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 256, 6]", | |
| "name" : "var_1048", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 256 × 2)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 256, 2]", | |
| "name" : "var_1105", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "var_1113", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "var_1134", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 128 × 5)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 128, 5]", | |
| "name" : "var_1178", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 128 × 2)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 128, 2]", | |
| "name" : "var_1235", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "var_1243", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "var_1264", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 64 × 4)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 64, 4]", | |
| "name" : "var_1308", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 64 × 2)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 64, 2]", | |
| "name" : "var_1365", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "var_1373", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "var_1394", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 64 × 2)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 64, 2]", | |
| "name" : "var_1450", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "var_1458", | |
| "type" : "MultiArray" | |
| } | |
| ], | |
| "modelParameters" : [ | |
| ], | |
| "specificationVersion" : 7, | |
| "mlProgramOperationTypeHistogram" : { | |
| "Transpose" : 10, | |
| "Ios16.elu" : 10, | |
| "Ios16.scatterAlongAxis" : 4, | |
| "Ios16.softmax" : 2, | |
| "Ios16.sin" : 2, | |
| "Identity" : 3, | |
| "Ios16.linear" : 8, | |
| "Ios16.add" : 29, | |
| "Concat" : 9, | |
| "Ios16.convTranspose" : 4, | |
| "Tile" : 12, | |
| "Select" : 9, | |
| "Ios16.greaterEqual" : 6, | |
| "Ios16.logicalAnd" : 4, | |
| "Ios16.fillLike" : 2, | |
| "Ios16.greater" : 5, | |
| "Ios16.lessEqual" : 2, | |
| "ExpandDims" : 8, | |
| "Ios16.sub" : 21, | |
| "Ios16.cast" : 4, | |
| "Ios16.reshape" : 37, | |
| "Ios16.less" : 2, | |
| "Ios16.matmul" : 4, | |
| "Ios16.layerNorm" : 4, | |
| "SliceByIndex" : 43, | |
| "Stack" : 4, | |
| "Ios16.scatter" : 4, | |
| "Ios16.floor" : 4, | |
| "Ios16.gelu" : 2, | |
| "Ios16.mul" : 34, | |
| "Ios16.cos" : 2, | |
| "Ios16.conv" : 8 | |
| }, | |
| "computePrecision" : "Mixed (Float16, Int32)", | |
| "isUpdatable" : "0", | |
| "stateSchema" : [ | |
| ], | |
| "availability" : { | |
| "macOS" : "13.0", | |
| "tvOS" : "16.0", | |
| "visionOS" : "1.0", | |
| "watchOS" : "9.0", | |
| "iOS" : "16.0", | |
| "macCatalyst" : "16.0" | |
| }, | |
| "modelType" : { | |
| "name" : "MLModelType_mlProgram" | |
| }, | |
| "userDefinedMetadata" : { | |
| "com.github.apple.coremltools.conversion_date" : "2026-01-28", | |
| "com.github.apple.coremltools.source" : "torch==2.10.0", | |
| "com.github.apple.coremltools.version" : "9.0", | |
| "com.github.apple.coremltools.source_dialect" : "TorchScript" | |
| }, | |
| "inputSchema" : [ | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 512 × 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 512, 1]", | |
| "name" : "latent", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 512 × 16)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 512, 16]", | |
| "name" : "upsample_partial", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 2 × 1 × 8 × 256 × 64)", | |
| "shortDescription" : "", | |
| "shape" : "[2, 1, 8, 256, 64]", | |
| "name" : "attn0_cache", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "attn0_offset", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "attn0_end_offset", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 2 × 1 × 8 × 256 × 64)", | |
| "shortDescription" : "", | |
| "shape" : "[2, 1, 8, 256, 64]", | |
| "name" : "attn1_cache", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "attn1_offset", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "attn1_end_offset", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 512 × 6)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 512, 6]", | |
| "name" : "conv0_prev", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "conv0_first", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 256 × 6)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 256, 6]", | |
| "name" : "convtr0_partial", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 256 × 2)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 256, 2]", | |
| "name" : "res0_conv0_prev", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "res0_conv0_first", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "res0_conv1_first", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 128 × 5)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 128, 5]", | |
| "name" : "convtr1_partial", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 128 × 2)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 128, 2]", | |
| "name" : "res1_conv0_prev", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "res1_conv0_first", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "res1_conv1_first", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 64 × 4)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 64, 4]", | |
| "name" : "convtr2_partial", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 64 × 2)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 64, 2]", | |
| "name" : "res2_conv0_prev", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "res2_conv0_first", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "res2_conv1_first", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1 × 64 × 2)", | |
| "shortDescription" : "", | |
| "shape" : "[1, 64, 2]", | |
| "name" : "conv_final_prev", | |
| "type" : "MultiArray" | |
| }, | |
| { | |
| "hasShapeFlexibility" : "0", | |
| "isOptional" : "0", | |
| "dataType" : "Float16", | |
| "formattedType" : "MultiArray (Float16 1)", | |
| "shortDescription" : "", | |
| "shape" : "[1]", | |
| "name" : "conv_final_first", | |
| "type" : "MultiArray" | |
| } | |
| ], | |
| "generatedClassName" : "mimi_decoder_v3", | |
| "method" : "predict" | |
| } | |
| ] |