{ "bizCode": "MNNTest", "extraInfo": { "version": "3.4.0" } , "oplists": [ { "main_type": "Input", "main": { "dims": [ 1, 1, 2560 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "input_ids", "outputIndexes": [ 4 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1, 1, -1, -1 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "attention_mask", "outputIndexes": [ 126 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1, -1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "name": "position_ids", "outputIndexes": [ 2 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 32, 2, 1, -1, 4, 128 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "past_key_values", "outputIndexes": [ 0 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "name": "logits_index", "outputIndexes": [ 3 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 0 ] , "main_type": "Reshape", "main": { "dims": [ -1 ] , "dimType": "NCHW" } , "name": "presents", "outputIndexes": [ 1 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 3 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1, -1, 2560 ] } , "name": "/blocks.0/Constant_output_0", "outputIndexes": [ 5 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/Reshape_output_0", "outputIndexes": [ 6 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 6 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 0, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.0/input_layernorm/Mul_1_output_0", "outputIndexes": [ 7 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 7 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2899 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2899 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2900 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2900 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 20480, 3276822, 819200, 0, 0 ] } , "name": "/layers.0/self_attn/q_proj/Linear", "outputIndexes": [ 2901 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2901 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2902 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2902 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 8 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 7 ] , "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_output_0", "outputIndexes": [ 9 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 9 ] , "main_type": "NONE", "name": "Shape51", "outputIndexes": [ 10 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 9 ] , "main_type": "NONE", "name": "Rank53", "outputIndexes": [ 11 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 11, 11 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp55", "outputIndexes": [ 12 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze56", "outputIndexes": [ 13 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1 ] } , "name": "Const9", "outputIndexes": [ 14 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp58", "outputIndexes": [ 15 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 15 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze59", "outputIndexes": [ 16 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1 ] } , "name": "Unsqueeze61", "outputIndexes": [ 17 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10, 13, 16, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice62", "outputIndexes": [ 18 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 18 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze63", "outputIndexes": [ 19 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 19, 19 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp65", "outputIndexes": [ 20 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 9, 20, 12 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_output_0", "outputIndexes": [ 21 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 0 ] } , "name": "/rotary/Constant_4_output_0", "outputIndexes": [ 22 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 21, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_output_0", "outputIndexes": [ 23 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze75", "outputIndexes": [ 24 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 15 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze78", "outputIndexes": [ 25 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10, 24, 25, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice81", "outputIndexes": [ 26 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 26 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze82", "outputIndexes": [ 27 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 27 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp83", "outputIndexes": [ 28 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 28, 27 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp84", "outputIndexes": [ 29 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 9, 29, 12 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_1_output_0", "outputIndexes": [ 30 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 30, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 31 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 20 ] } , "name": "/blocks.0/self_attn/Constant_3_output_0", "outputIndexes": [ 32 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 128 ] } , "name": "/blocks.0/self_attn/Constant_4_output_0", "outputIndexes": [ 33 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 23, 31, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.0/self_attn/Concat_output_0", "outputIndexes": [ 34 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 8, 34 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/self_attn/Reshape_output_0", "outputIndexes": [ 35 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2 ] , "main_type": "CastParam", "main": { "srcT": "DT_VARIANT", "dstT": "DT_FLOAT" } , "name": "/rotary/Cast_output_0", "outputIndexes": [ 36 ] , "type": "Cast", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 2 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ -1, 1 ] } , "name": "/rotary/Constant_1_output_0", "outputIndexes": [ 37 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 36, 37 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/rotary/Reshape_output_0", "outputIndexes": [ 38 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 64 ] , "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": [ 1.0, 0.865964, 0.749894, 0.649382, 0.562341, 0.486968, 0.421697, 0.365174, 0.316228, 0.273842, 0.237137, 0.205353, 0.177828, 0.153993, 0.133352, 0.115478, 0.1, 0.086596, 0.074989, 0.064938, 0.056234, 0.048697, 0.04217, 0.036517, 0.031623, 0.027384, 0.023714, 0.020535, 0.017783, 0.015399, 0.013335, 0.011548, 0.01, 0.00866, 0.007499, 0.006494, 0.005623, 0.00487, 0.004217, 0.003652, 0.003162, 0.002738, 0.002371, 0.002054, 0.001778, 0.00154, 0.001334, 0.001155, 0.001, 0.000866, 0.00075, 0.000649, 0.000562, 0.000487, 0.000422, 0.000365, 0.000316, 0.000274, 0.000237, 0.000205, 0.000178, 0.000154, 0.000133, 0.000115 ] } , "name": "/rotary/Constant_2_output_0", "outputIndexes": [ 39 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 38, 39 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/rotary/Mul_output_0", "outputIndexes": [ 40 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 40 ] , "main_type": "UnaryOp", "main": { "opType": "COS", "T": "DT_FLOAT" } , "name": "/rotary/Cos_output_0", "outputIndexes": [ 41 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 41, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_output_0", "outputIndexes": [ 42 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 40 ] , "main_type": "UnaryOp", "main": { "opType": "SIN", "T": "DT_FLOAT" } , "name": "/rotary/Sin_output_0", "outputIndexes": [ 43 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 43, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_1_output_0", "outputIndexes": [ 44 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 42, 44 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/rotary/Concat_output_0", "outputIndexes": [ 45 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 45, 45 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/rotary/Concat_1_output_0", "outputIndexes": [ 46 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 2 ] } , "name": "/rotary/Constant_7_output_0", "outputIndexes": [ 47 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 46, 47 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_2_output_0", "outputIndexes": [ 48 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 48, 17 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_3_output_0", "outputIndexes": [ 49 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 49 ] , "main_type": "NONE", "name": "Shape107", "outputIndexes": [ 50 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 49 ] , "main_type": "NONE", "name": "Rank109", "outputIndexes": [ 51 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 51, 51 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp111", "outputIndexes": [ 52 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 52 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze112", "outputIndexes": [ 53 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 52, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp114", "outputIndexes": [ 54 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze115", "outputIndexes": [ 55 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 50, 53, 55, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice118", "outputIndexes": [ 56 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze119", "outputIndexes": [ 57 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 57, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp121", "outputIndexes": [ 58 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 49, 58, 52 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_2_output_0", "outputIndexes": [ 59 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 35, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_output_0", "outputIndexes": [ 60 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 35 ] , "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_2_output_0", "outputIndexes": [ 61 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 3 ] } , "name": "/blocks.0/self_attn/Constant_10_output_0", "outputIndexes": [ 62 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61 ] , "main_type": "NONE", "name": "Shape239", "outputIndexes": [ 63 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 61 ] , "main_type": "NONE", "name": "Rank241", "outputIndexes": [ 64 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 64, 64 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp243", "outputIndexes": [ 65 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 65 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze244", "outputIndexes": [ 66 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 65, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp246", "outputIndexes": [ 67 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 67 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze247", "outputIndexes": [ 68 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 63, 66, 68, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice250", "outputIndexes": [ 69 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 69 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze251", "outputIndexes": [ 70 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 70 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp252", "outputIndexes": [ 71 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 71, 70 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp253", "outputIndexes": [ 72 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 72, 65 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_4_output_0", "outputIndexes": [ 73 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 2 ] } , "name": "/rotary/Constant_6_output_0", "outputIndexes": [ 74 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 73, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Div_output_0", "outputIndexes": [ 75 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 75, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 76 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1073741824 ] } , "name": "/blocks.0/self_attn/Constant_19_output_0", "outputIndexes": [ 77 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 3 ] } , "name": "/blocks.0/self_attn/Constant_13_output_0", "outputIndexes": [ 78 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 35, 76, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_1_output_0", "outputIndexes": [ 79 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 79 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.0/self_attn/Neg_output_0", "outputIndexes": [ 80 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 75, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 81 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 35, 22, 81, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_output_0", "outputIndexes": [ 82 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 80, 82 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.0/self_attn/Concat_3_output_0", "outputIndexes": [ 83 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 52 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze158", "outputIndexes": [ 84 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze161", "outputIndexes": [ 85 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 50, 84, 85, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice164", "outputIndexes": [ 86 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 86 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze165", "outputIndexes": [ 87 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 87 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp166", "outputIndexes": [ 88 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 88, 87 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp167", "outputIndexes": [ 89 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 49, 89, 52 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_3_output_0", "outputIndexes": [ 90 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 83, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_1_output_0", "outputIndexes": [ 91 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 91 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Add_output_0", "outputIndexes": [ 92 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2900 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4116502, 655382, 163840, 0, 0 ] } , "name": "/layers.0/self_attn/k_proj/Linear", "outputIndexes": [ 2905 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2905 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2906 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2906 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 93 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 21, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 94 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 30, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 95 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 4 ] } , "name": "/blocks.0/self_attn/Constant_6_output_0", "outputIndexes": [ 96 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 95, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.0/self_attn/Concat_1_output_0", "outputIndexes": [ 97 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 93, 97 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/self_attn/Reshape_1_output_0", "outputIndexes": [ 98 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 98, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_2_output_0", "outputIndexes": [ 99 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 98 ] , "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_3_output_0", "outputIndexes": [ 100 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 100 ] , "main_type": "NONE", "name": "Shape126", "outputIndexes": [ 101 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 100 ] , "main_type": "NONE", "name": "Rank128", "outputIndexes": [ 102 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 102, 102 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp130", "outputIndexes": [ 103 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 103 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze131", "outputIndexes": [ 104 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 103, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp133", "outputIndexes": [ 105 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 105 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze134", "outputIndexes": [ 106 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 101, 104, 106, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice137", "outputIndexes": [ 107 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 107 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze138", "outputIndexes": [ 108 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 108 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp139", "outputIndexes": [ 109 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 109, 108 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp140", "outputIndexes": [ 110 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 100, 110, 103 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_5_output_0", "outputIndexes": [ 111 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 111, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Div_1_output_0", "outputIndexes": [ 112 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 112, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 113 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 98, 113, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_3_output_0", "outputIndexes": [ 114 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 114 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.0/self_attn/Neg_1_output_0", "outputIndexes": [ 115 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 112, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 116 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 98, 22, 116, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_2_output_0", "outputIndexes": [ 117 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 115, 117 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.0/self_attn/Concat_4_output_0", "outputIndexes": [ 118 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 118, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_3_output_0", "outputIndexes": [ 119 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 99, 119 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Add_1_output_0", "outputIndexes": [ 120 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2900 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4935724, 655382, 163840, 0, 0 ] } , "name": "/layers.0/self_attn/v_proj/Linear", "outputIndexes": [ 2909 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2909 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2910 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2910 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 121 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 21, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 122 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 30, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 123 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 122, 123, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.0/self_attn/Concat_2_output_0", "outputIndexes": [ 124 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 121, 124 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/self_attn/Reshape_2_output_0", "outputIndexes": [ 125 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 92, 120, 125, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.0/self_attn/Reshape_7_output_0", "outputIndexes": [ 127 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 127 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2911 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2911 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2912 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2912 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 5754946, 3276822, 819200, 0, 0 ] } , "name": "/layers.0/self_attn/o_proj/Linear", "outputIndexes": [ 2913 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2913 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2914 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2914 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 128 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 6, 128 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/Add_output_0", "outputIndexes": [ 129 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 129 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 9850968, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.0/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 130 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 130 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2915 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2915 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2916 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2916 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 9871448, 13434902, 3358720, 0, 0 ] } , "name": "/layers.0/mlp/gate_proj/Linear", "outputIndexes": [ 2917 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2917 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2918 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2918 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 131 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 131 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.0/mlp/act_fn/Mul_output_0", "outputIndexes": [ 132 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2916 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 26665070, 13434902, 3358720, 0, 0 ] } , "name": "/layers.0/mlp/up_proj/Linear", "outputIndexes": [ 2921 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2921 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2922 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2922 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 133 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 132, 133 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/mlp/Mul_output_0", "outputIndexes": [ 134 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 134 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2923 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2923 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2924 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2924 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 43458692, 13434902, 3358720, 0, 0 ] } , "name": "/layers.0/mlp/down_proj/Linear", "outputIndexes": [ 2925 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2925 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2926 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2926 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 135 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 129, 135 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/Add_1_output_0", "outputIndexes": [ 136 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 136, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/Reshape_output_0", "outputIndexes": [ 137 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 137 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 60252314, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.1/input_layernorm/Mul_1_output_0", "outputIndexes": [ 138 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 138 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2927 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2927 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2928 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2928 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 60272794, 3276822, 819200, 0, 0 ] } , "name": "/layers.1/self_attn/q_proj/Linear", "outputIndexes": [ 2929 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2929 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2930 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2930 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 139 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 138 ] , "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_output_0", "outputIndexes": [ 140 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 140 ] , "main_type": "NONE", "name": "Shape484", "outputIndexes": [ 141 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 140 ] , "main_type": "NONE", "name": "Rank486", "outputIndexes": [ 142 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 142, 142 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp488", "outputIndexes": [ 143 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 143 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze489", "outputIndexes": [ 144 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 143, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp491", "outputIndexes": [ 145 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 145 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze492", "outputIndexes": [ 146 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 141, 144, 146, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice495", "outputIndexes": [ 147 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 147 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze496", "outputIndexes": [ 148 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 148, 148 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp498", "outputIndexes": [ 149 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 140, 149, 143 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_output_0", "outputIndexes": [ 150 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 150, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_output_0", "outputIndexes": [ 151 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 143 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze506", "outputIndexes": [ 152 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 145 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze509", "outputIndexes": [ 153 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 141, 152, 153, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice512", "outputIndexes": [ 154 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 154 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze513", "outputIndexes": [ 155 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 155 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp514", "outputIndexes": [ 156 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 156, 155 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp515", "outputIndexes": [ 157 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 140, 157, 143 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_1_output_0", "outputIndexes": [ 158 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 158, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 159 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 151, 159, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.1/self_attn/Concat_output_0", "outputIndexes": [ 160 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 139, 160 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/self_attn/Reshape_output_0", "outputIndexes": [ 161 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 161, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_output_0", "outputIndexes": [ 162 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 161 ] , "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_2_output_0", "outputIndexes": [ 163 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 163 ] , "main_type": "NONE", "name": "Shape615", "outputIndexes": [ 164 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 163 ] , "main_type": "NONE", "name": "Rank617", "outputIndexes": [ 165 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 165, 165 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp619", "outputIndexes": [ 166 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 166 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze620", "outputIndexes": [ 167 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 166, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp622", "outputIndexes": [ 168 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 168 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze623", "outputIndexes": [ 169 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 164, 167, 169, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice626", "outputIndexes": [ 170 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 170 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze627", "outputIndexes": [ 171 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 171 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp628", "outputIndexes": [ 172 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 172, 171 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp629", "outputIndexes": [ 173 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 163, 173, 166 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_2_output_0", "outputIndexes": [ 174 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 174, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Div_output_0", "outputIndexes": [ 175 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 175, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 176 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 161, 176, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_1_output_0", "outputIndexes": [ 177 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 177 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.1/self_attn/Neg_output_0", "outputIndexes": [ 178 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 175, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 179 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 161, 22, 179, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_output_0", "outputIndexes": [ 180 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 178, 180 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.1/self_attn/Concat_3_output_0", "outputIndexes": [ 181 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 181, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_1_output_0", "outputIndexes": [ 182 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 162, 182 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Add_output_0", "outputIndexes": [ 183 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2928 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 64368816, 655382, 163840, 0, 0 ] } , "name": "/layers.1/self_attn/k_proj/Linear", "outputIndexes": [ 2933 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2933 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2934 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2934 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 184 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 150, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 185 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 158, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 186 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 185, 186, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.1/self_attn/Concat_1_output_0", "outputIndexes": [ 187 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 184, 187 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/self_attn/Reshape_1_output_0", "outputIndexes": [ 188 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 188, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_2_output_0", "outputIndexes": [ 189 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 188 ] , "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_3_output_0", "outputIndexes": [ 190 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 190 ] , "main_type": "NONE", "name": "Shape522", "outputIndexes": [ 191 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 190 ] , "main_type": "NONE", "name": "Rank524", "outputIndexes": [ 192 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 192, 192 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp526", "outputIndexes": [ 193 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 193 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze527", "outputIndexes": [ 194 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 193, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp529", "outputIndexes": [ 195 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 195 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze530", "outputIndexes": [ 196 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 191, 194, 196, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice533", "outputIndexes": [ 197 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 197 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze534", "outputIndexes": [ 198 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 198 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp535", "outputIndexes": [ 199 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 199, 198 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp536", "outputIndexes": [ 200 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 190, 200, 193 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_3_output_0", "outputIndexes": [ 201 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 201, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Div_1_output_0", "outputIndexes": [ 202 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 202, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 203 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 188, 203, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_3_output_0", "outputIndexes": [ 204 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 204 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.1/self_attn/Neg_1_output_0", "outputIndexes": [ 205 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 202, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 206 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 188, 22, 206, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_2_output_0", "outputIndexes": [ 207 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 205, 207 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.1/self_attn/Concat_4_output_0", "outputIndexes": [ 208 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 208, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_3_output_0", "outputIndexes": [ 209 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 189, 209 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Add_1_output_0", "outputIndexes": [ 210 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2928 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 65188038, 655382, 163840, 0, 0 ] } , "name": "/layers.1/self_attn/v_proj/Linear", "outputIndexes": [ 2937 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2937 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2938 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2938 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 211 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 150, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 212 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 158, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 213 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 212, 213, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.1/self_attn/Concat_2_output_0", "outputIndexes": [ 214 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 211, 214 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/self_attn/Reshape_2_output_0", "outputIndexes": [ 215 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 183, 210, 215, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.1/self_attn/Reshape_7_output_0", "outputIndexes": [ 216 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 216 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2939 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2939 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2940 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2940 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 66007260, 3276822, 819200, 0, 0 ] } , "name": "/layers.1/self_attn/o_proj/Linear", "outputIndexes": [ 2941 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2941 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2942 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2942 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 217 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 137, 217 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/Add_output_0", "outputIndexes": [ 218 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 218 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 70103282, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.1/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 219 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 219 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2943 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2943 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2944 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2944 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 70123762, 13434902, 3358720, 0, 0 ] } , "name": "/layers.1/mlp/gate_proj/Linear", "outputIndexes": [ 2945 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2945 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2946 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2946 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 220 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 220 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.1/mlp/act_fn/Mul_output_0", "outputIndexes": [ 221 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2944 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 86917384, 13434902, 3358720, 0, 0 ] } , "name": "/layers.1/mlp/up_proj/Linear", "outputIndexes": [ 2949 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2949 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2950 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2950 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 222 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 221, 222 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/mlp/Mul_output_0", "outputIndexes": [ 223 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 223 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2951 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2951 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2952 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2952 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 103711006, 13434902, 3358720, 0, 0 ] } , "name": "/layers.1/mlp/down_proj/Linear", "outputIndexes": [ 2953 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2953 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2954 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2954 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 224 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 218, 224 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/Add_1_output_0", "outputIndexes": [ 225 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 225, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/Reshape_output_0", "outputIndexes": [ 226 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 226 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 120504628, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.2/input_layernorm/Mul_1_output_0", "outputIndexes": [ 227 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 227 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2955 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2955 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2956 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2956 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 120525108, 3276822, 819200, 0, 0 ] } , "name": "/layers.2/self_attn/q_proj/Linear", "outputIndexes": [ 2957 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2957 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2958 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2958 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 228 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 227 ] , "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_output_0", "outputIndexes": [ 229 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 229 ] , "main_type": "NONE", "name": "Shape854", "outputIndexes": [ 230 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 229 ] , "main_type": "NONE", "name": "Rank856", "outputIndexes": [ 231 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 231, 231 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp858", "outputIndexes": [ 232 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 232 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze859", "outputIndexes": [ 233 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 232, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp861", "outputIndexes": [ 234 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 234 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze862", "outputIndexes": [ 235 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 230, 233, 235, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice865", "outputIndexes": [ 236 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 236 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze866", "outputIndexes": [ 237 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 237, 237 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp868", "outputIndexes": [ 238 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 229, 238, 232 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_output_0", "outputIndexes": [ 239 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 239, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_output_0", "outputIndexes": [ 240 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 232 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze876", "outputIndexes": [ 241 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 234 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze879", "outputIndexes": [ 242 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 230, 241, 242, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice882", "outputIndexes": [ 243 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 243 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze883", "outputIndexes": [ 244 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 244 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp884", "outputIndexes": [ 245 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 245, 244 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp885", "outputIndexes": [ 246 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 229, 246, 232 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_1_output_0", "outputIndexes": [ 247 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 247, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 248 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 240, 248, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.2/self_attn/Concat_output_0", "outputIndexes": [ 249 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 228, 249 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/self_attn/Reshape_output_0", "outputIndexes": [ 250 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 250, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_output_0", "outputIndexes": [ 251 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 250 ] , "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_2_output_0", "outputIndexes": [ 252 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 252 ] , "main_type": "NONE", "name": "Shape985", "outputIndexes": [ 253 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 252 ] , "main_type": "NONE", "name": "Rank987", "outputIndexes": [ 254 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 254, 254 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp989", "outputIndexes": [ 255 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 255 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze990", "outputIndexes": [ 256 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 255, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp992", "outputIndexes": [ 257 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 257 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze993", "outputIndexes": [ 258 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 253, 256, 258, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice996", "outputIndexes": [ 259 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 259 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze997", "outputIndexes": [ 260 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 260 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp998", "outputIndexes": [ 261 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 261, 260 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp999", "outputIndexes": [ 262 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 252, 262, 255 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_2_output_0", "outputIndexes": [ 263 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 263, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Div_output_0", "outputIndexes": [ 264 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 264, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 265 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 250, 265, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_1_output_0", "outputIndexes": [ 266 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 266 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.2/self_attn/Neg_output_0", "outputIndexes": [ 267 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 264, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 268 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 250, 22, 268, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_output_0", "outputIndexes": [ 269 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 267, 269 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.2/self_attn/Concat_3_output_0", "outputIndexes": [ 270 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 270, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_1_output_0", "outputIndexes": [ 271 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 251, 271 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Add_output_0", "outputIndexes": [ 272 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2956 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 124621130, 655382, 163840, 0, 0 ] } , "name": "/layers.2/self_attn/k_proj/Linear", "outputIndexes": [ 2961 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2961 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2962 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2962 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 273 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 239, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 274 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 247, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 275 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 274, 275, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.2/self_attn/Concat_1_output_0", "outputIndexes": [ 276 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 273, 276 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/self_attn/Reshape_1_output_0", "outputIndexes": [ 277 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 277, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_2_output_0", "outputIndexes": [ 278 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 277 ] , "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_3_output_0", "outputIndexes": [ 279 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 279 ] , "main_type": "NONE", "name": "Shape892", "outputIndexes": [ 280 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 279 ] , "main_type": "NONE", "name": "Rank894", "outputIndexes": [ 281 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 281, 281 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp896", "outputIndexes": [ 282 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 282 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze897", "outputIndexes": [ 283 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 282, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp899", "outputIndexes": [ 284 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 284 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze900", "outputIndexes": [ 285 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 280, 283, 285, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice903", "outputIndexes": [ 286 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 286 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze904", "outputIndexes": [ 287 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 287 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp905", "outputIndexes": [ 288 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 288, 287 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp906", "outputIndexes": [ 289 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 279, 289, 282 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_3_output_0", "outputIndexes": [ 290 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 290, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Div_1_output_0", "outputIndexes": [ 291 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 291, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 292 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 277, 292, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_3_output_0", "outputIndexes": [ 293 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 293 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.2/self_attn/Neg_1_output_0", "outputIndexes": [ 294 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 291, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 295 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 277, 22, 295, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_2_output_0", "outputIndexes": [ 296 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 294, 296 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.2/self_attn/Concat_4_output_0", "outputIndexes": [ 297 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 297, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_3_output_0", "outputIndexes": [ 298 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 278, 298 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Add_1_output_0", "outputIndexes": [ 299 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2956 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 125440352, 655382, 163840, 0, 0 ] } , "name": "/layers.2/self_attn/v_proj/Linear", "outputIndexes": [ 2965 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2965 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2966 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2966 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 300 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 239, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 301 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 247, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 302 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 301, 302, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.2/self_attn/Concat_2_output_0", "outputIndexes": [ 303 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 300, 303 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/self_attn/Reshape_2_output_0", "outputIndexes": [ 304 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 272, 299, 304, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.2/self_attn/Reshape_7_output_0", "outputIndexes": [ 305 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 305 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2967 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2967 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2968 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2968 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 126259574, 3276822, 819200, 0, 0 ] } , "name": "/layers.2/self_attn/o_proj/Linear", "outputIndexes": [ 2969 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2969 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2970 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2970 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 306 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 226, 306 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/Add_output_0", "outputIndexes": [ 307 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 307 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 130355596, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.2/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 308 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 308 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2971 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2971 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2972 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2972 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 130376076, 13434902, 3358720, 0, 0 ] } , "name": "/layers.2/mlp/gate_proj/Linear", "outputIndexes": [ 2973 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2973 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2974 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2974 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 309 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 309 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.2/mlp/act_fn/Mul_output_0", "outputIndexes": [ 310 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2972 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 147169698, 13434902, 3358720, 0, 0 ] } , "name": "/layers.2/mlp/up_proj/Linear", "outputIndexes": [ 2977 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2977 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2978 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2978 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 311 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 310, 311 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/mlp/Mul_output_0", "outputIndexes": [ 312 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 312 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2979 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2979 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2980 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2980 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 163963320, 13434902, 3358720, 0, 0 ] } , "name": "/layers.2/mlp/down_proj/Linear", "outputIndexes": [ 2981 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2981 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2982 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2982 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 313 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 307, 313 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/Add_1_output_0", "outputIndexes": [ 314 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 314, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/Reshape_output_0", "outputIndexes": [ 315 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 315 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 180756942, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.3/input_layernorm/Mul_1_output_0", "outputIndexes": [ 316 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 316 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2983 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2983 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2984 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2984 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 180777422, 3276822, 819200, 0, 0 ] } , "name": "/layers.3/self_attn/q_proj/Linear", "outputIndexes": [ 2985 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2985 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2986 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2986 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 317 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 316 ] , "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_output_0", "outputIndexes": [ 318 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 318 ] , "main_type": "NONE", "name": "Shape1224", "outputIndexes": [ 319 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 318 ] , "main_type": "NONE", "name": "Rank1226", "outputIndexes": [ 320 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 320, 320 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1228", "outputIndexes": [ 321 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 321 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1229", "outputIndexes": [ 322 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 321, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1231", "outputIndexes": [ 323 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 323 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1232", "outputIndexes": [ 324 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 319, 322, 324, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1235", "outputIndexes": [ 325 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 325 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1236", "outputIndexes": [ 326 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 326, 326 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1238", "outputIndexes": [ 327 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 318, 327, 321 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_output_0", "outputIndexes": [ 328 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 328, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_output_0", "outputIndexes": [ 329 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 321 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1246", "outputIndexes": [ 330 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 323 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1249", "outputIndexes": [ 331 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 319, 330, 331, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1252", "outputIndexes": [ 332 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 332 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1253", "outputIndexes": [ 333 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 333 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1254", "outputIndexes": [ 334 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 334, 333 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1255", "outputIndexes": [ 335 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 318, 335, 321 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_1_output_0", "outputIndexes": [ 336 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 336, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 337 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 329, 337, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.3/self_attn/Concat_output_0", "outputIndexes": [ 338 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 317, 338 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/self_attn/Reshape_output_0", "outputIndexes": [ 339 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 339, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_output_0", "outputIndexes": [ 340 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 339 ] , "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_2_output_0", "outputIndexes": [ 341 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 341 ] , "main_type": "NONE", "name": "Shape1356", "outputIndexes": [ 342 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 341 ] , "main_type": "NONE", "name": "Rank1358", "outputIndexes": [ 343 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 343, 343 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1360", "outputIndexes": [ 344 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 344 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1361", "outputIndexes": [ 345 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 344, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1363", "outputIndexes": [ 346 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 346 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1364", "outputIndexes": [ 347 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 342, 345, 347, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1367", "outputIndexes": [ 348 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 348 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1368", "outputIndexes": [ 349 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 349 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1369", "outputIndexes": [ 350 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 350, 349 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1370", "outputIndexes": [ 351 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 341, 351, 344 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_2_output_0", "outputIndexes": [ 352 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 352, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Div_output_0", "outputIndexes": [ 353 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 353, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 354 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 339, 354, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_1_output_0", "outputIndexes": [ 355 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 355 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.3/self_attn/Neg_output_0", "outputIndexes": [ 356 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 353, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 357 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 339, 22, 357, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_output_0", "outputIndexes": [ 358 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 356, 358 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.3/self_attn/Concat_3_output_0", "outputIndexes": [ 359 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 359, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_1_output_0", "outputIndexes": [ 360 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 340, 360 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Add_output_0", "outputIndexes": [ 361 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2984 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 184873444, 655382, 163840, 0, 0 ] } , "name": "/layers.3/self_attn/k_proj/Linear", "outputIndexes": [ 2989 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2989 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2990 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2990 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 362 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 328, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 363 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 336, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 364 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 363, 364, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.3/self_attn/Concat_1_output_0", "outputIndexes": [ 365 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 362, 365 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/self_attn/Reshape_1_output_0", "outputIndexes": [ 366 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 366, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_2_output_0", "outputIndexes": [ 367 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 366 ] , "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_3_output_0", "outputIndexes": [ 368 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 368 ] , "main_type": "NONE", "name": "Shape1262", "outputIndexes": [ 369 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 368 ] , "main_type": "NONE", "name": "Rank1264", "outputIndexes": [ 370 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 370, 370 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1266", "outputIndexes": [ 371 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 371 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1267", "outputIndexes": [ 372 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 371, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1269", "outputIndexes": [ 373 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 373 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1270", "outputIndexes": [ 374 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 369, 372, 374, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1273", "outputIndexes": [ 375 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 375 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1274", "outputIndexes": [ 376 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 376 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1275", "outputIndexes": [ 377 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 377, 376 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1276", "outputIndexes": [ 378 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 368, 378, 371 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_3_output_0", "outputIndexes": [ 379 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 379, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Div_1_output_0", "outputIndexes": [ 380 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 380, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 381 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 366, 381, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_3_output_0", "outputIndexes": [ 382 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 382 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.3/self_attn/Neg_1_output_0", "outputIndexes": [ 383 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 380, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 384 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 366, 22, 384, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_2_output_0", "outputIndexes": [ 385 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 383, 385 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.3/self_attn/Concat_4_output_0", "outputIndexes": [ 386 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 386, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_3_output_0", "outputIndexes": [ 387 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 367, 387 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Add_1_output_0", "outputIndexes": [ 388 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2984 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 185692666, 655382, 163840, 0, 0 ] } , "name": "/layers.3/self_attn/v_proj/Linear", "outputIndexes": [ 2993 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2993 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2994 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2994 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 389 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 328, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 390 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 336, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 391 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 390, 391, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.3/self_attn/Concat_2_output_0", "outputIndexes": [ 392 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 389, 392 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/self_attn/Reshape_2_output_0", "outputIndexes": [ 393 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 361, 388, 393, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.3/self_attn/Reshape_7_output_0", "outputIndexes": [ 394 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 394 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2995 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2995 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2996 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2996 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 186511888, 3276822, 819200, 0, 0 ] } , "name": "/layers.3/self_attn/o_proj/Linear", "outputIndexes": [ 2997 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2997 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2998 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2998 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 395 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 315, 395 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/Add_output_0", "outputIndexes": [ 396 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 396 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 190607910, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.3/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 397 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 397 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2999 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2999 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3000 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3000 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 190628390, 13434902, 3358720, 0, 0 ] } , "name": "/layers.3/mlp/gate_proj/Linear", "outputIndexes": [ 3001 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3001 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3002 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3002 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 398 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 398 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.3/mlp/act_fn/Mul_output_0", "outputIndexes": [ 399 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3000 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 207422012, 13434902, 3358720, 0, 0 ] } , "name": "/layers.3/mlp/up_proj/Linear", "outputIndexes": [ 3005 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3005 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3006 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3006 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 400 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 399, 400 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/mlp/Mul_output_0", "outputIndexes": [ 401 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 401 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3007 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3007 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3008 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3008 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 224215634, 13434902, 3358720, 0, 0 ] } , "name": "/layers.3/mlp/down_proj/Linear", "outputIndexes": [ 3009 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3009 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3010 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3010 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 402 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 396, 402 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/Add_1_output_0", "outputIndexes": [ 403 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 403, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/Reshape_output_0", "outputIndexes": [ 404 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 404 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 241009256, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.4/input_layernorm/Mul_1_output_0", "outputIndexes": [ 405 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 405 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3011 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3011 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3012 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3012 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 241029736, 3276822, 819200, 0, 0 ] } , "name": "/layers.4/self_attn/q_proj/Linear", "outputIndexes": [ 3013 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3013 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3014 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3014 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 406 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 405 ] , "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_output_0", "outputIndexes": [ 407 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 407 ] , "main_type": "NONE", "name": "Shape1595", "outputIndexes": [ 408 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 407 ] , "main_type": "NONE", "name": "Rank1597", "outputIndexes": [ 409 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 409, 409 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1599", "outputIndexes": [ 410 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1600", "outputIndexes": [ 411 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1602", "outputIndexes": [ 412 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 412 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1603", "outputIndexes": [ 413 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 408, 411, 413, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1606", "outputIndexes": [ 414 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 414 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1607", "outputIndexes": [ 415 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 415, 415 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1609", "outputIndexes": [ 416 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 407, 416, 410 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_output_0", "outputIndexes": [ 417 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 417, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_output_0", "outputIndexes": [ 418 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1617", "outputIndexes": [ 419 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 412 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1620", "outputIndexes": [ 420 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 408, 419, 420, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1623", "outputIndexes": [ 421 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 421 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1624", "outputIndexes": [ 422 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 422 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1625", "outputIndexes": [ 423 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 423, 422 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1626", "outputIndexes": [ 424 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 407, 424, 410 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_1_output_0", "outputIndexes": [ 425 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 425, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 426 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 418, 426, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.4/self_attn/Concat_output_0", "outputIndexes": [ 427 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 406, 427 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/self_attn/Reshape_output_0", "outputIndexes": [ 428 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 428, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_output_0", "outputIndexes": [ 429 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 428 ] , "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_2_output_0", "outputIndexes": [ 430 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 430 ] , "main_type": "NONE", "name": "Shape1726", "outputIndexes": [ 431 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 430 ] , "main_type": "NONE", "name": "Rank1728", "outputIndexes": [ 432 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 432, 432 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1730", "outputIndexes": [ 433 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 433 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1731", "outputIndexes": [ 434 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 433, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1733", "outputIndexes": [ 435 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 435 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1734", "outputIndexes": [ 436 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 431, 434, 436, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1737", "outputIndexes": [ 437 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 437 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1738", "outputIndexes": [ 438 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 438 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1739", "outputIndexes": [ 439 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 439, 438 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1740", "outputIndexes": [ 440 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 430, 440, 433 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_2_output_0", "outputIndexes": [ 441 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 441, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Div_output_0", "outputIndexes": [ 442 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 442, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 443 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 428, 443, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_1_output_0", "outputIndexes": [ 444 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 444 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.4/self_attn/Neg_output_0", "outputIndexes": [ 445 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 442, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 446 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 428, 22, 446, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_output_0", "outputIndexes": [ 447 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 445, 447 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.4/self_attn/Concat_3_output_0", "outputIndexes": [ 448 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 448, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_1_output_0", "outputIndexes": [ 449 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 429, 449 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Add_output_0", "outputIndexes": [ 450 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3012 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 245125758, 655382, 163840, 0, 0 ] } , "name": "/layers.4/self_attn/k_proj/Linear", "outputIndexes": [ 3017 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3017 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3018 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3018 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 451 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 417, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 452 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 425, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 453 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 452, 453, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.4/self_attn/Concat_1_output_0", "outputIndexes": [ 454 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 451, 454 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/self_attn/Reshape_1_output_0", "outputIndexes": [ 455 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 455, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_2_output_0", "outputIndexes": [ 456 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 455 ] , "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_3_output_0", "outputIndexes": [ 457 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 457 ] , "main_type": "NONE", "name": "Shape1633", "outputIndexes": [ 458 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 457 ] , "main_type": "NONE", "name": "Rank1635", "outputIndexes": [ 459 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 459, 459 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1637", "outputIndexes": [ 460 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 460 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1638", "outputIndexes": [ 461 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 460, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1640", "outputIndexes": [ 462 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 462 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1641", "outputIndexes": [ 463 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 458, 461, 463, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1644", "outputIndexes": [ 464 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 464 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1645", "outputIndexes": [ 465 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 465 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1646", "outputIndexes": [ 466 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 466, 465 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1647", "outputIndexes": [ 467 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 457, 467, 460 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_3_output_0", "outputIndexes": [ 468 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 468, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Div_1_output_0", "outputIndexes": [ 469 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 469, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 470 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 455, 470, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_3_output_0", "outputIndexes": [ 471 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 471 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.4/self_attn/Neg_1_output_0", "outputIndexes": [ 472 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 469, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 473 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 455, 22, 473, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_2_output_0", "outputIndexes": [ 474 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 472, 474 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.4/self_attn/Concat_4_output_0", "outputIndexes": [ 475 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 475, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_3_output_0", "outputIndexes": [ 476 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 456, 476 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Add_1_output_0", "outputIndexes": [ 477 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3012 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 245944980, 655382, 163840, 0, 0 ] } , "name": "/layers.4/self_attn/v_proj/Linear", "outputIndexes": [ 3021 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3021 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3022 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3022 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 478 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 417, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 479 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 425, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 480 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 479, 480, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.4/self_attn/Concat_2_output_0", "outputIndexes": [ 481 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 478, 481 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/self_attn/Reshape_2_output_0", "outputIndexes": [ 482 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 450, 477, 482, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.4/self_attn/Reshape_7_output_0", "outputIndexes": [ 483 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 483 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3023 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3023 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3024 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3024 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 246764202, 3276822, 819200, 0, 0 ] } , "name": "/layers.4/self_attn/o_proj/Linear", "outputIndexes": [ 3025 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3025 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3026 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3026 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 484 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 404, 484 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/Add_output_0", "outputIndexes": [ 485 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 485 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 250860224, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.4/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 486 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 486 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3027 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3027 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3028 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3028 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 250880704, 13434902, 3358720, 0, 0 ] } , "name": "/layers.4/mlp/gate_proj/Linear", "outputIndexes": [ 3029 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3029 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3030 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3030 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 487 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 487 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.4/mlp/act_fn/Mul_output_0", "outputIndexes": [ 488 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3028 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 267674326, 13434902, 3358720, 0, 0 ] } , "name": "/layers.4/mlp/up_proj/Linear", "outputIndexes": [ 3033 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3033 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3034 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3034 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 489 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 488, 489 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/mlp/Mul_output_0", "outputIndexes": [ 490 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 490 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3035 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3035 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3036 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3036 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 284467948, 13434902, 3358720, 0, 0 ] } , "name": "/layers.4/mlp/down_proj/Linear", "outputIndexes": [ 3037 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3037 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3038 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3038 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 491 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 485, 491 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/Add_1_output_0", "outputIndexes": [ 492 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 492, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/Reshape_output_0", "outputIndexes": [ 493 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 493 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 301261570, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.5/input_layernorm/Mul_1_output_0", "outputIndexes": [ 494 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 494 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3039 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3039 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3040 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3040 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 301282050, 3276822, 819200, 0, 0 ] } , "name": "/layers.5/self_attn/q_proj/Linear", "outputIndexes": [ 3041 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3041 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3042 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3042 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 495 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 494 ] , "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_output_0", "outputIndexes": [ 496 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 496 ] , "main_type": "NONE", "name": "Shape1965", "outputIndexes": [ 497 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 496 ] , "main_type": "NONE", "name": "Rank1967", "outputIndexes": [ 498 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 498, 498 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1969", "outputIndexes": [ 499 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 499 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1970", "outputIndexes": [ 500 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 499, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1972", "outputIndexes": [ 501 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 501 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1973", "outputIndexes": [ 502 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 497, 500, 502, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1976", "outputIndexes": [ 503 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 503 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1977", "outputIndexes": [ 504 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 504, 504 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1979", "outputIndexes": [ 505 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 496, 505, 499 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_output_0", "outputIndexes": [ 506 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 506, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_output_0", "outputIndexes": [ 507 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 499 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1987", "outputIndexes": [ 508 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 501 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1990", "outputIndexes": [ 509 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 497, 508, 509, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1993", "outputIndexes": [ 510 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 510 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1994", "outputIndexes": [ 511 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 511 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1995", "outputIndexes": [ 512 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 512, 511 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1996", "outputIndexes": [ 513 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 496, 513, 499 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_1_output_0", "outputIndexes": [ 514 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 514, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 515 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 507, 515, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.5/self_attn/Concat_output_0", "outputIndexes": [ 516 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 495, 516 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/self_attn/Reshape_output_0", "outputIndexes": [ 517 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 517, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_output_0", "outputIndexes": [ 518 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 517 ] , "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_2_output_0", "outputIndexes": [ 519 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 519 ] , "main_type": "NONE", "name": "Shape2097", "outputIndexes": [ 520 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 519 ] , "main_type": "NONE", "name": "Rank2099", "outputIndexes": [ 521 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 521, 521 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2101", "outputIndexes": [ 522 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 522 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2102", "outputIndexes": [ 523 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 522, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2104", "outputIndexes": [ 524 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 524 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2105", "outputIndexes": [ 525 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 520, 523, 525, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2108", "outputIndexes": [ 526 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 526 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2109", "outputIndexes": [ 527 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 527 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2110", "outputIndexes": [ 528 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 528, 527 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2111", "outputIndexes": [ 529 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 519, 529, 522 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_2_output_0", "outputIndexes": [ 530 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 530, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Div_output_0", "outputIndexes": [ 531 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 531, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 532 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 517, 532, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_1_output_0", "outputIndexes": [ 533 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 533 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.5/self_attn/Neg_output_0", "outputIndexes": [ 534 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 531, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 535 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 517, 22, 535, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_output_0", "outputIndexes": [ 536 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 534, 536 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.5/self_attn/Concat_3_output_0", "outputIndexes": [ 537 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 537, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_1_output_0", "outputIndexes": [ 538 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 518, 538 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Add_output_0", "outputIndexes": [ 539 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3040 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 305378072, 655382, 163840, 0, 0 ] } , "name": "/layers.5/self_attn/k_proj/Linear", "outputIndexes": [ 3045 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3045 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3046 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3046 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 540 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 506, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 541 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 514, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 542 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 541, 542, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.5/self_attn/Concat_1_output_0", "outputIndexes": [ 543 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 540, 543 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/self_attn/Reshape_1_output_0", "outputIndexes": [ 544 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 544, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_2_output_0", "outputIndexes": [ 545 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 544 ] , "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_3_output_0", "outputIndexes": [ 546 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 546 ] , "main_type": "NONE", "name": "Shape2003", "outputIndexes": [ 547 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 546 ] , "main_type": "NONE", "name": "Rank2005", "outputIndexes": [ 548 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 548, 548 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2007", "outputIndexes": [ 549 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 549 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2008", "outputIndexes": [ 550 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 549, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2010", "outputIndexes": [ 551 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 551 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2011", "outputIndexes": [ 552 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 547, 550, 552, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2014", "outputIndexes": [ 553 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 553 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2015", "outputIndexes": [ 554 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 554 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2016", "outputIndexes": [ 555 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 555, 554 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2017", "outputIndexes": [ 556 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 546, 556, 549 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_3_output_0", "outputIndexes": [ 557 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 557, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Div_1_output_0", "outputIndexes": [ 558 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 558, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 559 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 544, 559, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_3_output_0", "outputIndexes": [ 560 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 560 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.5/self_attn/Neg_1_output_0", "outputIndexes": [ 561 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 558, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 562 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 544, 22, 562, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_2_output_0", "outputIndexes": [ 563 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 561, 563 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.5/self_attn/Concat_4_output_0", "outputIndexes": [ 564 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 564, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_3_output_0", "outputIndexes": [ 565 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 545, 565 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Add_1_output_0", "outputIndexes": [ 566 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3040 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 306197294, 655382, 163840, 0, 0 ] } , "name": "/layers.5/self_attn/v_proj/Linear", "outputIndexes": [ 3049 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3049 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3050 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3050 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 567 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 506, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 568 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 514, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 569 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 568, 569, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.5/self_attn/Concat_2_output_0", "outputIndexes": [ 570 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 567, 570 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/self_attn/Reshape_2_output_0", "outputIndexes": [ 571 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 539, 566, 571, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.5/self_attn/Reshape_7_output_0", "outputIndexes": [ 572 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 572 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3051 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3051 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3052 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3052 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 307016516, 3276822, 819200, 0, 0 ] } , "name": "/layers.5/self_attn/o_proj/Linear", "outputIndexes": [ 3053 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3053 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3054 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3054 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 573 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 493, 573 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/Add_output_0", "outputIndexes": [ 574 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 574 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 311112538, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.5/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 575 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 575 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3055 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3055 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3056 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3056 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 311133018, 13434902, 3358720, 0, 0 ] } , "name": "/layers.5/mlp/gate_proj/Linear", "outputIndexes": [ 3057 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3057 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3058 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3058 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 576 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 576 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.5/mlp/act_fn/Mul_output_0", "outputIndexes": [ 577 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3056 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 327926640, 13434902, 3358720, 0, 0 ] } , "name": "/layers.5/mlp/up_proj/Linear", "outputIndexes": [ 3061 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3061 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3062 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3062 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 578 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 577, 578 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/mlp/Mul_output_0", "outputIndexes": [ 579 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 579 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3063 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3063 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3064 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3064 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 344720262, 13434902, 3358720, 0, 0 ] } , "name": "/layers.5/mlp/down_proj/Linear", "outputIndexes": [ 3065 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3065 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3066 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3066 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 580 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 574, 580 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/Add_1_output_0", "outputIndexes": [ 581 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 581, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/Reshape_output_0", "outputIndexes": [ 582 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 582 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 361513884, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.6/input_layernorm/Mul_1_output_0", "outputIndexes": [ 583 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 583 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3067 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3067 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3068 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3068 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 361534364, 3276822, 819200, 0, 0 ] } , "name": "/layers.6/self_attn/q_proj/Linear", "outputIndexes": [ 3069 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3069 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3070 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3070 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 584 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 583 ] , "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_output_0", "outputIndexes": [ 585 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 585 ] , "main_type": "NONE", "name": "Shape2336", "outputIndexes": [ 586 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 585 ] , "main_type": "NONE", "name": "Rank2338", "outputIndexes": [ 587 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 587, 587 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2340", "outputIndexes": [ 588 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 588 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2341", "outputIndexes": [ 589 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 588, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2343", "outputIndexes": [ 590 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 590 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2344", "outputIndexes": [ 591 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 586, 589, 591, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2347", "outputIndexes": [ 592 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 592 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2348", "outputIndexes": [ 593 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 593, 593 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2350", "outputIndexes": [ 594 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 585, 594, 588 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_output_0", "outputIndexes": [ 595 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 595, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_output_0", "outputIndexes": [ 596 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 588 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2358", "outputIndexes": [ 597 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 590 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2361", "outputIndexes": [ 598 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 586, 597, 598, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2364", "outputIndexes": [ 599 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 599 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2365", "outputIndexes": [ 600 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 600 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2366", "outputIndexes": [ 601 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 601, 600 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2367", "outputIndexes": [ 602 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 585, 602, 588 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_1_output_0", "outputIndexes": [ 603 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 603, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 604 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 596, 604, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.6/self_attn/Concat_output_0", "outputIndexes": [ 605 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 584, 605 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/self_attn/Reshape_output_0", "outputIndexes": [ 606 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 606, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_output_0", "outputIndexes": [ 607 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 606 ] , "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_2_output_0", "outputIndexes": [ 608 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 608 ] , "main_type": "NONE", "name": "Shape2468", "outputIndexes": [ 609 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 608 ] , "main_type": "NONE", "name": "Rank2470", "outputIndexes": [ 610 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 610, 610 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2472", "outputIndexes": [ 611 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 611 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2473", "outputIndexes": [ 612 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 611, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2475", "outputIndexes": [ 613 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 613 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2476", "outputIndexes": [ 614 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 609, 612, 614, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2479", "outputIndexes": [ 615 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 615 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2480", "outputIndexes": [ 616 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 616 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2481", "outputIndexes": [ 617 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 617, 616 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2482", "outputIndexes": [ 618 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 608, 618, 611 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_2_output_0", "outputIndexes": [ 619 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 619, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Div_output_0", "outputIndexes": [ 620 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 620, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 621 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 606, 621, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_1_output_0", "outputIndexes": [ 622 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 622 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.6/self_attn/Neg_output_0", "outputIndexes": [ 623 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 620, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 624 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 606, 22, 624, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_output_0", "outputIndexes": [ 625 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 623, 625 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.6/self_attn/Concat_3_output_0", "outputIndexes": [ 626 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 626, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_1_output_0", "outputIndexes": [ 627 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 607, 627 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Add_output_0", "outputIndexes": [ 628 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3068 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 365630386, 655382, 163840, 0, 0 ] } , "name": "/layers.6/self_attn/k_proj/Linear", "outputIndexes": [ 3073 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3073 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3074 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3074 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 629 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 595, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 630 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 603, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 631 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 630, 631, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.6/self_attn/Concat_1_output_0", "outputIndexes": [ 632 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 629, 632 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/self_attn/Reshape_1_output_0", "outputIndexes": [ 633 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 633, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_2_output_0", "outputIndexes": [ 634 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 633 ] , "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_3_output_0", "outputIndexes": [ 635 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 635 ] , "main_type": "NONE", "name": "Shape2374", "outputIndexes": [ 636 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 635 ] , "main_type": "NONE", "name": "Rank2376", "outputIndexes": [ 637 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 637, 637 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2378", "outputIndexes": [ 638 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 638 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2379", "outputIndexes": [ 639 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 638, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2381", "outputIndexes": [ 640 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 640 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2382", "outputIndexes": [ 641 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 636, 639, 641, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2385", "outputIndexes": [ 642 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 642 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2386", "outputIndexes": [ 643 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 643 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2387", "outputIndexes": [ 644 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 644, 643 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2388", "outputIndexes": [ 645 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 635, 645, 638 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_3_output_0", "outputIndexes": [ 646 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 646, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Div_1_output_0", "outputIndexes": [ 647 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 647, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 648 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 633, 648, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_3_output_0", "outputIndexes": [ 649 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 649 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.6/self_attn/Neg_1_output_0", "outputIndexes": [ 650 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 647, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 651 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 633, 22, 651, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_2_output_0", "outputIndexes": [ 652 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 650, 652 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.6/self_attn/Concat_4_output_0", "outputIndexes": [ 653 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 653, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_3_output_0", "outputIndexes": [ 654 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 634, 654 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Add_1_output_0", "outputIndexes": [ 655 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3068 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 366449608, 655382, 163840, 0, 0 ] } , "name": "/layers.6/self_attn/v_proj/Linear", "outputIndexes": [ 3077 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3077 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3078 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3078 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 656 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 595, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 657 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 603, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 658 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 657, 658, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.6/self_attn/Concat_2_output_0", "outputIndexes": [ 659 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 656, 659 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/self_attn/Reshape_2_output_0", "outputIndexes": [ 660 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 628, 655, 660, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.6/self_attn/Reshape_7_output_0", "outputIndexes": [ 661 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 661 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3079 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3079 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3080 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3080 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 367268830, 3276822, 819200, 0, 0 ] } , "name": "/layers.6/self_attn/o_proj/Linear", "outputIndexes": [ 3081 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3081 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3082 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3082 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 662 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 582, 662 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/Add_output_0", "outputIndexes": [ 663 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 663 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 371364852, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.6/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 664 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 664 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3083 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3083 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3084 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3084 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 371385332, 13434902, 3358720, 0, 0 ] } , "name": "/layers.6/mlp/gate_proj/Linear", "outputIndexes": [ 3085 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3085 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3086 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3086 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 665 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 665 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.6/mlp/act_fn/Mul_output_0", "outputIndexes": [ 666 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3084 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 388178954, 13434902, 3358720, 0, 0 ] } , "name": "/layers.6/mlp/up_proj/Linear", "outputIndexes": [ 3089 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3089 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3090 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3090 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 667 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 666, 667 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/mlp/Mul_output_0", "outputIndexes": [ 668 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 668 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3091 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3091 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3092 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3092 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 404972576, 13434902, 3358720, 0, 0 ] } , "name": "/layers.6/mlp/down_proj/Linear", "outputIndexes": [ 3093 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3093 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3094 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3094 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 669 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 663, 669 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/Add_1_output_0", "outputIndexes": [ 670 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 670, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/Reshape_output_0", "outputIndexes": [ 671 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 671 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 421766198, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.7/input_layernorm/Mul_1_output_0", "outputIndexes": [ 672 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 672 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3095 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3095 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3096 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3096 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 421786678, 3276822, 819200, 0, 0 ] } , "name": "/layers.7/self_attn/q_proj/Linear", "outputIndexes": [ 3097 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3097 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3098 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3098 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 673 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 672 ] , "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_output_0", "outputIndexes": [ 674 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 674 ] , "main_type": "NONE", "name": "Shape2707", "outputIndexes": [ 675 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 674 ] , "main_type": "NONE", "name": "Rank2709", "outputIndexes": [ 676 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 676, 676 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2711", "outputIndexes": [ 677 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 677 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2712", "outputIndexes": [ 678 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 677, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2714", "outputIndexes": [ 679 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 679 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2715", "outputIndexes": [ 680 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 675, 678, 680, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2718", "outputIndexes": [ 681 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 681 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2719", "outputIndexes": [ 682 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 682, 682 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2721", "outputIndexes": [ 683 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 674, 683, 677 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_output_0", "outputIndexes": [ 684 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 684, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_output_0", "outputIndexes": [ 685 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 677 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2729", "outputIndexes": [ 686 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 679 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2732", "outputIndexes": [ 687 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 675, 686, 687, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2735", "outputIndexes": [ 688 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 688 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2736", "outputIndexes": [ 689 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 689 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2737", "outputIndexes": [ 690 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 690, 689 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2738", "outputIndexes": [ 691 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 674, 691, 677 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_1_output_0", "outputIndexes": [ 692 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 692, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 693 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 685, 693, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.7/self_attn/Concat_output_0", "outputIndexes": [ 694 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 673, 694 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/self_attn/Reshape_output_0", "outputIndexes": [ 695 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 695, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_output_0", "outputIndexes": [ 696 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 695 ] , "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_2_output_0", "outputIndexes": [ 697 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 697 ] , "main_type": "NONE", "name": "Shape2839", "outputIndexes": [ 698 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 697 ] , "main_type": "NONE", "name": "Rank2841", "outputIndexes": [ 699 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 699, 699 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2843", "outputIndexes": [ 700 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 700 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2844", "outputIndexes": [ 701 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 700, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2846", "outputIndexes": [ 702 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 702 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2847", "outputIndexes": [ 703 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 698, 701, 703, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2850", "outputIndexes": [ 704 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 704 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2851", "outputIndexes": [ 705 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 705 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2852", "outputIndexes": [ 706 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 706, 705 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2853", "outputIndexes": [ 707 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 697, 707, 700 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_2_output_0", "outputIndexes": [ 708 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 708, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Div_output_0", "outputIndexes": [ 709 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 709, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 710 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 695, 710, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_1_output_0", "outputIndexes": [ 711 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 711 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.7/self_attn/Neg_output_0", "outputIndexes": [ 712 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 709, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 713 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 695, 22, 713, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_output_0", "outputIndexes": [ 714 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 712, 714 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.7/self_attn/Concat_3_output_0", "outputIndexes": [ 715 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 715, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_1_output_0", "outputIndexes": [ 716 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 696, 716 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Add_output_0", "outputIndexes": [ 717 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3096 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 425882700, 655382, 163840, 0, 0 ] } , "name": "/layers.7/self_attn/k_proj/Linear", "outputIndexes": [ 3101 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3101 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3102 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3102 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 718 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 684, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 719 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 692, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 720 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 719, 720, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.7/self_attn/Concat_1_output_0", "outputIndexes": [ 721 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 718, 721 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/self_attn/Reshape_1_output_0", "outputIndexes": [ 722 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 722, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_2_output_0", "outputIndexes": [ 723 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 722 ] , "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_3_output_0", "outputIndexes": [ 724 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 724 ] , "main_type": "NONE", "name": "Shape2745", "outputIndexes": [ 725 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 724 ] , "main_type": "NONE", "name": "Rank2747", "outputIndexes": [ 726 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 726, 726 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2749", "outputIndexes": [ 727 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 727 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2750", "outputIndexes": [ 728 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 727, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2752", "outputIndexes": [ 729 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 729 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2753", "outputIndexes": [ 730 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 725, 728, 730, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2756", "outputIndexes": [ 731 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 731 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2757", "outputIndexes": [ 732 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 732 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2758", "outputIndexes": [ 733 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 733, 732 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2759", "outputIndexes": [ 734 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 724, 734, 727 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_3_output_0", "outputIndexes": [ 735 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 735, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Div_1_output_0", "outputIndexes": [ 736 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 736, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 737 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 722, 737, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_3_output_0", "outputIndexes": [ 738 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 738 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.7/self_attn/Neg_1_output_0", "outputIndexes": [ 739 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 736, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 740 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 722, 22, 740, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_2_output_0", "outputIndexes": [ 741 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 739, 741 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.7/self_attn/Concat_4_output_0", "outputIndexes": [ 742 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 742, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_3_output_0", "outputIndexes": [ 743 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 723, 743 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Add_1_output_0", "outputIndexes": [ 744 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3096 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 426701922, 655382, 163840, 0, 0 ] } , "name": "/layers.7/self_attn/v_proj/Linear", "outputIndexes": [ 3105 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3105 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3106 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3106 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 745 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 684, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 746 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 692, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 747 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 746, 747, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.7/self_attn/Concat_2_output_0", "outputIndexes": [ 748 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 745, 748 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/self_attn/Reshape_2_output_0", "outputIndexes": [ 749 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 717, 744, 749, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.7/self_attn/Reshape_7_output_0", "outputIndexes": [ 750 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 750 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3107 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3107 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3108 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3108 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 427521144, 3276822, 819200, 0, 0 ] } , "name": "/layers.7/self_attn/o_proj/Linear", "outputIndexes": [ 3109 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3109 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3110 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3110 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 751 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 671, 751 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/Add_output_0", "outputIndexes": [ 752 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 752 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 431617166, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.7/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 753 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 753 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3111 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3111 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3112 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3112 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 431637646, 13434902, 3358720, 0, 0 ] } , "name": "/layers.7/mlp/gate_proj/Linear", "outputIndexes": [ 3113 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3113 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3114 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3114 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 754 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 754 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.7/mlp/act_fn/Mul_output_0", "outputIndexes": [ 755 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3112 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 448431268, 13434902, 3358720, 0, 0 ] } , "name": "/layers.7/mlp/up_proj/Linear", "outputIndexes": [ 3117 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3117 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3118 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3118 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 756 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 755, 756 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/mlp/Mul_output_0", "outputIndexes": [ 757 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 757 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3119 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3119 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3120 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3120 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 465224890, 13434902, 3358720, 0, 0 ] } , "name": "/layers.7/mlp/down_proj/Linear", "outputIndexes": [ 3121 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3121 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3122 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3122 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 758 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 752, 758 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/Add_1_output_0", "outputIndexes": [ 759 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 759, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/Reshape_output_0", "outputIndexes": [ 760 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 760 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 482018512, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.8/input_layernorm/Mul_1_output_0", "outputIndexes": [ 761 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 761 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3123 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3123 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3124 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3124 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 482038992, 3276822, 819200, 0, 0 ] } , "name": "/layers.8/self_attn/q_proj/Linear", "outputIndexes": [ 3125 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3125 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3126 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3126 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 762 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 761 ] , "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_output_0", "outputIndexes": [ 763 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 763 ] , "main_type": "NONE", "name": "Shape3078", "outputIndexes": [ 764 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 763 ] , "main_type": "NONE", "name": "Rank3080", "outputIndexes": [ 765 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 765, 765 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3082", "outputIndexes": [ 766 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 766 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3083", "outputIndexes": [ 767 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 766, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3085", "outputIndexes": [ 768 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 768 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3086", "outputIndexes": [ 769 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 764, 767, 769, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3089", "outputIndexes": [ 770 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 770 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3090", "outputIndexes": [ 771 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 771, 771 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3092", "outputIndexes": [ 772 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 763, 772, 766 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_output_0", "outputIndexes": [ 773 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 773, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_output_0", "outputIndexes": [ 774 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 766 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3100", "outputIndexes": [ 775 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 768 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3103", "outputIndexes": [ 776 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 764, 775, 776, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3106", "outputIndexes": [ 777 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 777 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3107", "outputIndexes": [ 778 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 778 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3108", "outputIndexes": [ 779 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 779, 778 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3109", "outputIndexes": [ 780 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 763, 780, 766 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_1_output_0", "outputIndexes": [ 781 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 781, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 782 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 774, 782, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.8/self_attn/Concat_output_0", "outputIndexes": [ 783 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 762, 783 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/self_attn/Reshape_output_0", "outputIndexes": [ 784 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 784, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_output_0", "outputIndexes": [ 785 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 784 ] , "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_2_output_0", "outputIndexes": [ 786 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 786 ] , "main_type": "NONE", "name": "Shape3210", "outputIndexes": [ 787 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 786 ] , "main_type": "NONE", "name": "Rank3212", "outputIndexes": [ 788 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 788, 788 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3214", "outputIndexes": [ 789 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 789 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3215", "outputIndexes": [ 790 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 789, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3217", "outputIndexes": [ 791 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 791 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3218", "outputIndexes": [ 792 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 787, 790, 792, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3221", "outputIndexes": [ 793 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 793 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3222", "outputIndexes": [ 794 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 794 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3223", "outputIndexes": [ 795 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 795, 794 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3224", "outputIndexes": [ 796 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 786, 796, 789 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_2_output_0", "outputIndexes": [ 797 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 797, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Div_output_0", "outputIndexes": [ 798 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 798, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 799 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 784, 799, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_1_output_0", "outputIndexes": [ 800 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 800 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.8/self_attn/Neg_output_0", "outputIndexes": [ 801 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 798, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 802 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 784, 22, 802, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_output_0", "outputIndexes": [ 803 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 801, 803 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.8/self_attn/Concat_3_output_0", "outputIndexes": [ 804 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 804, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_1_output_0", "outputIndexes": [ 805 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 785, 805 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Add_output_0", "outputIndexes": [ 806 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3124 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 486135014, 655382, 163840, 0, 0 ] } , "name": "/layers.8/self_attn/k_proj/Linear", "outputIndexes": [ 3129 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3129 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3130 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3130 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 807 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 773, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 808 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 781, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 809 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 808, 809, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.8/self_attn/Concat_1_output_0", "outputIndexes": [ 810 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 807, 810 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/self_attn/Reshape_1_output_0", "outputIndexes": [ 811 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 811, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_2_output_0", "outputIndexes": [ 812 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 811 ] , "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_3_output_0", "outputIndexes": [ 813 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 813 ] , "main_type": "NONE", "name": "Shape3116", "outputIndexes": [ 814 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 813 ] , "main_type": "NONE", "name": "Rank3118", "outputIndexes": [ 815 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 815, 815 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3120", "outputIndexes": [ 816 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 816 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3121", "outputIndexes": [ 817 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 816, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3123", "outputIndexes": [ 818 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 818 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3124", "outputIndexes": [ 819 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 814, 817, 819, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3127", "outputIndexes": [ 820 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 820 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3128", "outputIndexes": [ 821 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 821 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3129", "outputIndexes": [ 822 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 822, 821 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3130", "outputIndexes": [ 823 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 813, 823, 816 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_3_output_0", "outputIndexes": [ 824 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 824, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Div_1_output_0", "outputIndexes": [ 825 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 825, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 826 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 811, 826, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_3_output_0", "outputIndexes": [ 827 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 827 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.8/self_attn/Neg_1_output_0", "outputIndexes": [ 828 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 825, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 829 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 811, 22, 829, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_2_output_0", "outputIndexes": [ 830 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 828, 830 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.8/self_attn/Concat_4_output_0", "outputIndexes": [ 831 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 831, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_3_output_0", "outputIndexes": [ 832 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 812, 832 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Add_1_output_0", "outputIndexes": [ 833 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3124 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 486954236, 655382, 163840, 0, 0 ] } , "name": "/layers.8/self_attn/v_proj/Linear", "outputIndexes": [ 3133 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3133 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3134 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3134 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 834 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 773, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 835 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 781, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 836 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 835, 836, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.8/self_attn/Concat_2_output_0", "outputIndexes": [ 837 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 834, 837 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/self_attn/Reshape_2_output_0", "outputIndexes": [ 838 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 806, 833, 838, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.8/self_attn/Reshape_7_output_0", "outputIndexes": [ 839 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 839 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3135 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3135 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3136 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3136 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 487773458, 3276822, 819200, 0, 0 ] } , "name": "/layers.8/self_attn/o_proj/Linear", "outputIndexes": [ 3137 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3137 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3138 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3138 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 840 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 760, 840 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/Add_output_0", "outputIndexes": [ 841 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 841 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 491869480, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.8/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 842 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 842 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3139 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3139 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3140 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3140 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 491889960, 13434902, 3358720, 0, 0 ] } , "name": "/layers.8/mlp/gate_proj/Linear", "outputIndexes": [ 3141 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3141 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3142 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3142 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 843 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 843 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.8/mlp/act_fn/Mul_output_0", "outputIndexes": [ 844 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3140 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 508683582, 13434902, 3358720, 0, 0 ] } , "name": "/layers.8/mlp/up_proj/Linear", "outputIndexes": [ 3145 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3145 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3146 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3146 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 845 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 844, 845 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/mlp/Mul_output_0", "outputIndexes": [ 846 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 846 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3147 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3147 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3148 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3148 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 525477204, 13434902, 3358720, 0, 0 ] } , "name": "/layers.8/mlp/down_proj/Linear", "outputIndexes": [ 3149 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3149 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3150 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3150 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 847 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 841, 847 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/Add_1_output_0", "outputIndexes": [ 848 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 848, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/Reshape_output_0", "outputIndexes": [ 849 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 849 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 542270826, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.9/input_layernorm/Mul_1_output_0", "outputIndexes": [ 850 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 850 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3151 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3151 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3152 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3152 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 542291306, 3276822, 819200, 0, 0 ] } , "name": "/layers.9/self_attn/q_proj/Linear", "outputIndexes": [ 3153 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3153 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3154 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3154 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 851 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 850 ] , "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_output_0", "outputIndexes": [ 852 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 852 ] , "main_type": "NONE", "name": "Shape3449", "outputIndexes": [ 853 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 852 ] , "main_type": "NONE", "name": "Rank3451", "outputIndexes": [ 854 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 854, 854 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3453", "outputIndexes": [ 855 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 855 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3454", "outputIndexes": [ 856 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 855, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3456", "outputIndexes": [ 857 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 857 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3457", "outputIndexes": [ 858 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 853, 856, 858, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3460", "outputIndexes": [ 859 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 859 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3461", "outputIndexes": [ 860 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 860, 860 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3463", "outputIndexes": [ 861 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 852, 861, 855 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_output_0", "outputIndexes": [ 862 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 862, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_output_0", "outputIndexes": [ 863 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 855 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3471", "outputIndexes": [ 864 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 857 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3474", "outputIndexes": [ 865 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 853, 864, 865, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3477", "outputIndexes": [ 866 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 866 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3478", "outputIndexes": [ 867 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 867 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3479", "outputIndexes": [ 868 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 868, 867 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3480", "outputIndexes": [ 869 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 852, 869, 855 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_1_output_0", "outputIndexes": [ 870 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 870, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 871 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 863, 871, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.9/self_attn/Concat_output_0", "outputIndexes": [ 872 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 851, 872 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/self_attn/Reshape_output_0", "outputIndexes": [ 873 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 873, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_output_0", "outputIndexes": [ 874 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 873 ] , "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_2_output_0", "outputIndexes": [ 875 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 875 ] , "main_type": "NONE", "name": "Shape3581", "outputIndexes": [ 876 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 875 ] , "main_type": "NONE", "name": "Rank3583", "outputIndexes": [ 877 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 877, 877 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3585", "outputIndexes": [ 878 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 878 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3586", "outputIndexes": [ 879 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 878, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3588", "outputIndexes": [ 880 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 880 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3589", "outputIndexes": [ 881 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 876, 879, 881, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3592", "outputIndexes": [ 882 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 882 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3593", "outputIndexes": [ 883 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 883 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3594", "outputIndexes": [ 884 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 884, 883 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3595", "outputIndexes": [ 885 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 875, 885, 878 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_2_output_0", "outputIndexes": [ 886 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 886, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Div_output_0", "outputIndexes": [ 887 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 887, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 888 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 873, 888, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_1_output_0", "outputIndexes": [ 889 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 889 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.9/self_attn/Neg_output_0", "outputIndexes": [ 890 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 887, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 891 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 873, 22, 891, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_output_0", "outputIndexes": [ 892 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 890, 892 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.9/self_attn/Concat_3_output_0", "outputIndexes": [ 893 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 893, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_1_output_0", "outputIndexes": [ 894 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 874, 894 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Add_output_0", "outputIndexes": [ 895 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3152 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 546387328, 655382, 163840, 0, 0 ] } , "name": "/layers.9/self_attn/k_proj/Linear", "outputIndexes": [ 3157 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3157 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3158 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3158 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 896 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 862, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 897 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 870, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 898 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 897, 898, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.9/self_attn/Concat_1_output_0", "outputIndexes": [ 899 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 896, 899 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/self_attn/Reshape_1_output_0", "outputIndexes": [ 900 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 900, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_2_output_0", "outputIndexes": [ 901 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 900 ] , "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_3_output_0", "outputIndexes": [ 902 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 902 ] , "main_type": "NONE", "name": "Shape3487", "outputIndexes": [ 903 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 902 ] , "main_type": "NONE", "name": "Rank3489", "outputIndexes": [ 904 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 904, 904 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3491", "outputIndexes": [ 905 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 905 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3492", "outputIndexes": [ 906 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 905, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3494", "outputIndexes": [ 907 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 907 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3495", "outputIndexes": [ 908 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 903, 906, 908, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3498", "outputIndexes": [ 909 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 909 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3499", "outputIndexes": [ 910 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 910 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3500", "outputIndexes": [ 911 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 911, 910 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3501", "outputIndexes": [ 912 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 902, 912, 905 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_3_output_0", "outputIndexes": [ 913 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 913, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Div_1_output_0", "outputIndexes": [ 914 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 914, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 915 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 900, 915, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_3_output_0", "outputIndexes": [ 916 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 916 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.9/self_attn/Neg_1_output_0", "outputIndexes": [ 917 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 914, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 918 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 900, 22, 918, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_2_output_0", "outputIndexes": [ 919 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 917, 919 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.9/self_attn/Concat_4_output_0", "outputIndexes": [ 920 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 920, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_3_output_0", "outputIndexes": [ 921 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 901, 921 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Add_1_output_0", "outputIndexes": [ 922 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3152 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 547206550, 655382, 163840, 0, 0 ] } , "name": "/layers.9/self_attn/v_proj/Linear", "outputIndexes": [ 3161 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3161 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3162 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3162 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 923 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 862, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 924 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 870, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 925 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 924, 925, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.9/self_attn/Concat_2_output_0", "outputIndexes": [ 926 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 923, 926 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/self_attn/Reshape_2_output_0", "outputIndexes": [ 927 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 895, 922, 927, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.9/self_attn/Reshape_7_output_0", "outputIndexes": [ 928 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 928 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3163 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3163 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3164 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3164 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 548025772, 3276822, 819200, 0, 0 ] } , "name": "/layers.9/self_attn/o_proj/Linear", "outputIndexes": [ 3165 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3165 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3166 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3166 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 929 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 849, 929 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/Add_output_0", "outputIndexes": [ 930 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 930 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 552121794, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.9/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 931 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 931 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3167 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3167 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3168 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3168 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 552142274, 13434902, 3358720, 0, 0 ] } , "name": "/layers.9/mlp/gate_proj/Linear", "outputIndexes": [ 3169 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3169 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3170 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3170 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 932 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 932 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.9/mlp/act_fn/Mul_output_0", "outputIndexes": [ 933 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3168 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 568935896, 13434902, 3358720, 0, 0 ] } , "name": "/layers.9/mlp/up_proj/Linear", "outputIndexes": [ 3173 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3173 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3174 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3174 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 934 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 933, 934 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/mlp/Mul_output_0", "outputIndexes": [ 935 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 935 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3175 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3175 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3176 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3176 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 585729518, 13434902, 3358720, 0, 0 ] } , "name": "/layers.9/mlp/down_proj/Linear", "outputIndexes": [ 3177 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3177 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3178 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3178 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 936 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 930, 936 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/Add_1_output_0", "outputIndexes": [ 937 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 937, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/Reshape_output_0", "outputIndexes": [ 938 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 938 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 602523140, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.10/input_layernorm/Mul_1_output_0", "outputIndexes": [ 939 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 939 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3179 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3179 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3180 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3180 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 602543620, 3276822, 819200, 0, 0 ] } , "name": "/layers.10/self_attn/q_proj/Linear", "outputIndexes": [ 3181 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3181 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3182 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3182 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 940 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 939 ] , "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_output_0", "outputIndexes": [ 941 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 941 ] , "main_type": "NONE", "name": "Shape3820", "outputIndexes": [ 942 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 941 ] , "main_type": "NONE", "name": "Rank3822", "outputIndexes": [ 943 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 943, 943 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3824", "outputIndexes": [ 944 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 944 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3825", "outputIndexes": [ 945 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 944, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3827", "outputIndexes": [ 946 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 946 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3828", "outputIndexes": [ 947 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 942, 945, 947, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3831", "outputIndexes": [ 948 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 948 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3832", "outputIndexes": [ 949 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 949, 949 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3834", "outputIndexes": [ 950 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 941, 950, 944 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_output_0", "outputIndexes": [ 951 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 951, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_output_0", "outputIndexes": [ 952 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 944 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3842", "outputIndexes": [ 953 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 946 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3845", "outputIndexes": [ 954 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 942, 953, 954, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3848", "outputIndexes": [ 955 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 955 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3849", "outputIndexes": [ 956 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 956 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3850", "outputIndexes": [ 957 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 957, 956 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3851", "outputIndexes": [ 958 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 941, 958, 944 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_1_output_0", "outputIndexes": [ 959 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 959, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 960 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 952, 960, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.10/self_attn/Concat_output_0", "outputIndexes": [ 961 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 940, 961 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/self_attn/Reshape_output_0", "outputIndexes": [ 962 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 962, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_output_0", "outputIndexes": [ 963 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 962 ] , "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_2_output_0", "outputIndexes": [ 964 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 964 ] , "main_type": "NONE", "name": "Shape3952", "outputIndexes": [ 965 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 964 ] , "main_type": "NONE", "name": "Rank3954", "outputIndexes": [ 966 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 966, 966 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3956", "outputIndexes": [ 967 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 967 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3957", "outputIndexes": [ 968 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 967, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3959", "outputIndexes": [ 969 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 969 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3960", "outputIndexes": [ 970 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 965, 968, 970, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3963", "outputIndexes": [ 971 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 971 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3964", "outputIndexes": [ 972 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 972 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3965", "outputIndexes": [ 973 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 973, 972 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3966", "outputIndexes": [ 974 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 964, 974, 967 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_2_output_0", "outputIndexes": [ 975 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 975, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Div_output_0", "outputIndexes": [ 976 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 976, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 977 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 962, 977, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_1_output_0", "outputIndexes": [ 978 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 978 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.10/self_attn/Neg_output_0", "outputIndexes": [ 979 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 976, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 980 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 962, 22, 980, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_output_0", "outputIndexes": [ 981 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 979, 981 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.10/self_attn/Concat_3_output_0", "outputIndexes": [ 982 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 982, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_1_output_0", "outputIndexes": [ 983 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 963, 983 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Add_output_0", "outputIndexes": [ 984 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3180 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 606639642, 655382, 163840, 0, 0 ] } , "name": "/layers.10/self_attn/k_proj/Linear", "outputIndexes": [ 3185 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3185 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3186 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3186 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 985 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 951, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 986 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 959, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 987 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 986, 987, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.10/self_attn/Concat_1_output_0", "outputIndexes": [ 988 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 985, 988 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/self_attn/Reshape_1_output_0", "outputIndexes": [ 989 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 989, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_2_output_0", "outputIndexes": [ 990 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 989 ] , "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_3_output_0", "outputIndexes": [ 991 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 991 ] , "main_type": "NONE", "name": "Shape3858", "outputIndexes": [ 992 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 991 ] , "main_type": "NONE", "name": "Rank3860", "outputIndexes": [ 993 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 993, 993 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3862", "outputIndexes": [ 994 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 994 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3863", "outputIndexes": [ 995 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 994, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3865", "outputIndexes": [ 996 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 996 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3866", "outputIndexes": [ 997 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 992, 995, 997, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3869", "outputIndexes": [ 998 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 998 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3870", "outputIndexes": [ 999 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 999 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3871", "outputIndexes": [ 1000 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1000, 999 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3872", "outputIndexes": [ 1001 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 991, 1001, 994 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_3_output_0", "outputIndexes": [ 1002 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1002, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Div_1_output_0", "outputIndexes": [ 1003 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1003, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1004 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 989, 1004, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_3_output_0", "outputIndexes": [ 1005 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1005 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.10/self_attn/Neg_1_output_0", "outputIndexes": [ 1006 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1003, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1007 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 989, 22, 1007, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_2_output_0", "outputIndexes": [ 1008 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1006, 1008 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.10/self_attn/Concat_4_output_0", "outputIndexes": [ 1009 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1009, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_3_output_0", "outputIndexes": [ 1010 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 990, 1010 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Add_1_output_0", "outputIndexes": [ 1011 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3180 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 607458864, 655382, 163840, 0, 0 ] } , "name": "/layers.10/self_attn/v_proj/Linear", "outputIndexes": [ 3189 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3189 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3190 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3190 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1012 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 951, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1013 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 959, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1014 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1013, 1014, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.10/self_attn/Concat_2_output_0", "outputIndexes": [ 1015 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1012, 1015 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/self_attn/Reshape_2_output_0", "outputIndexes": [ 1016 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 984, 1011, 1016, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.10/self_attn/Reshape_7_output_0", "outputIndexes": [ 1017 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1017 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3191 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3191 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3192 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3192 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 608278086, 3276822, 819200, 0, 0 ] } , "name": "/layers.10/self_attn/o_proj/Linear", "outputIndexes": [ 3193 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3193 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3194 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3194 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1018 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 938, 1018 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/Add_output_0", "outputIndexes": [ 1019 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1019 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 612374108, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.10/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1020 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1020 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3195 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3195 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3196 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3196 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 612394588, 13434902, 3358720, 0, 0 ] } , "name": "/layers.10/mlp/gate_proj/Linear", "outputIndexes": [ 3197 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3197 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3198 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3198 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1021 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1021 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.10/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1022 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3196 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 629188210, 13434902, 3358720, 0, 0 ] } , "name": "/layers.10/mlp/up_proj/Linear", "outputIndexes": [ 3201 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3201 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3202 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3202 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1023 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1022, 1023 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/mlp/Mul_output_0", "outputIndexes": [ 1024 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1024 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3203 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3203 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3204 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3204 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 645981832, 13434902, 3358720, 0, 0 ] } , "name": "/layers.10/mlp/down_proj/Linear", "outputIndexes": [ 3205 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3205 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3206 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3206 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1025 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1019, 1025 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/Add_1_output_0", "outputIndexes": [ 1026 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1026, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/Reshape_output_0", "outputIndexes": [ 1027 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1027 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 662775454, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.11/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1028 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1028 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3207 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3207 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3208 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3208 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 662795934, 3276822, 819200, 0, 0 ] } , "name": "/layers.11/self_attn/q_proj/Linear", "outputIndexes": [ 3209 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3209 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3210 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3210 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1029 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1028 ] , "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_output_0", "outputIndexes": [ 1030 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1030 ] , "main_type": "NONE", "name": "Shape4191", "outputIndexes": [ 1031 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1030 ] , "main_type": "NONE", "name": "Rank4193", "outputIndexes": [ 1032 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1032, 1032 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4195", "outputIndexes": [ 1033 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1033 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4196", "outputIndexes": [ 1034 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1033, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4198", "outputIndexes": [ 1035 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1035 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4199", "outputIndexes": [ 1036 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1031, 1034, 1036, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4202", "outputIndexes": [ 1037 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1037 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4203", "outputIndexes": [ 1038 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1038, 1038 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4205", "outputIndexes": [ 1039 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1030, 1039, 1033 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_output_0", "outputIndexes": [ 1040 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1040, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1041 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1033 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4213", "outputIndexes": [ 1042 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1035 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4216", "outputIndexes": [ 1043 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1031, 1042, 1043, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4219", "outputIndexes": [ 1044 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1044 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4220", "outputIndexes": [ 1045 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1045 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4221", "outputIndexes": [ 1046 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1046, 1045 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4222", "outputIndexes": [ 1047 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1030, 1047, 1033 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_1_output_0", "outputIndexes": [ 1048 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1048, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1049 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1041, 1049, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.11/self_attn/Concat_output_0", "outputIndexes": [ 1050 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1029, 1050 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/self_attn/Reshape_output_0", "outputIndexes": [ 1051 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1051, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_output_0", "outputIndexes": [ 1052 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1051 ] , "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_2_output_0", "outputIndexes": [ 1053 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1053 ] , "main_type": "NONE", "name": "Shape4323", "outputIndexes": [ 1054 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1053 ] , "main_type": "NONE", "name": "Rank4325", "outputIndexes": [ 1055 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1055, 1055 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4327", "outputIndexes": [ 1056 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1056 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4328", "outputIndexes": [ 1057 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1056, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4330", "outputIndexes": [ 1058 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1058 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4331", "outputIndexes": [ 1059 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1054, 1057, 1059, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4334", "outputIndexes": [ 1060 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1060 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4335", "outputIndexes": [ 1061 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1061 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4336", "outputIndexes": [ 1062 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1062, 1061 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4337", "outputIndexes": [ 1063 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1053, 1063, 1056 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_2_output_0", "outputIndexes": [ 1064 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1064, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Div_output_0", "outputIndexes": [ 1065 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1065, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1066 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1051, 1066, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_1_output_0", "outputIndexes": [ 1067 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1067 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.11/self_attn/Neg_output_0", "outputIndexes": [ 1068 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1065, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1069 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1051, 22, 1069, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_output_0", "outputIndexes": [ 1070 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1068, 1070 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.11/self_attn/Concat_3_output_0", "outputIndexes": [ 1071 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1071, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_1_output_0", "outputIndexes": [ 1072 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1052, 1072 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Add_output_0", "outputIndexes": [ 1073 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3208 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 666891956, 655382, 163840, 0, 0 ] } , "name": "/layers.11/self_attn/k_proj/Linear", "outputIndexes": [ 3213 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3213 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3214 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3214 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1074 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1040, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1075 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1048, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1076 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1075, 1076, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.11/self_attn/Concat_1_output_0", "outputIndexes": [ 1077 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1074, 1077 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/self_attn/Reshape_1_output_0", "outputIndexes": [ 1078 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1078, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_2_output_0", "outputIndexes": [ 1079 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1078 ] , "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_3_output_0", "outputIndexes": [ 1080 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1080 ] , "main_type": "NONE", "name": "Shape4229", "outputIndexes": [ 1081 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1080 ] , "main_type": "NONE", "name": "Rank4231", "outputIndexes": [ 1082 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1082, 1082 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4233", "outputIndexes": [ 1083 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1083 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4234", "outputIndexes": [ 1084 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1083, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4236", "outputIndexes": [ 1085 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1085 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4237", "outputIndexes": [ 1086 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1081, 1084, 1086, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4240", "outputIndexes": [ 1087 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1087 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4241", "outputIndexes": [ 1088 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1088 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4242", "outputIndexes": [ 1089 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1089, 1088 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4243", "outputIndexes": [ 1090 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1080, 1090, 1083 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_3_output_0", "outputIndexes": [ 1091 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1091, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Div_1_output_0", "outputIndexes": [ 1092 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1092, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1093 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1078, 1093, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_3_output_0", "outputIndexes": [ 1094 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1094 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.11/self_attn/Neg_1_output_0", "outputIndexes": [ 1095 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1092, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1096 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1078, 22, 1096, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_2_output_0", "outputIndexes": [ 1097 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1095, 1097 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.11/self_attn/Concat_4_output_0", "outputIndexes": [ 1098 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1098, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_3_output_0", "outputIndexes": [ 1099 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1079, 1099 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Add_1_output_0", "outputIndexes": [ 1100 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3208 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 667711178, 655382, 163840, 0, 0 ] } , "name": "/layers.11/self_attn/v_proj/Linear", "outputIndexes": [ 3217 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3217 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3218 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3218 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1101 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1040, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1102 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1048, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1103 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1102, 1103, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.11/self_attn/Concat_2_output_0", "outputIndexes": [ 1104 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1101, 1104 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/self_attn/Reshape_2_output_0", "outputIndexes": [ 1105 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1073, 1100, 1105, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.11/self_attn/Reshape_7_output_0", "outputIndexes": [ 1106 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1106 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3219 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3219 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3220 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3220 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 668530400, 3276822, 819200, 0, 0 ] } , "name": "/layers.11/self_attn/o_proj/Linear", "outputIndexes": [ 3221 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3221 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3222 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3222 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1107 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1027, 1107 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/Add_output_0", "outputIndexes": [ 1108 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1108 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 672626422, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.11/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1109 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1109 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3223 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3223 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3224 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3224 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 672646902, 13434902, 3358720, 0, 0 ] } , "name": "/layers.11/mlp/gate_proj/Linear", "outputIndexes": [ 3225 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3225 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3226 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3226 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1110 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1110 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.11/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1111 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3224 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 689440524, 13434902, 3358720, 0, 0 ] } , "name": "/layers.11/mlp/up_proj/Linear", "outputIndexes": [ 3229 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3229 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3230 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3230 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1112 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1111, 1112 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/mlp/Mul_output_0", "outputIndexes": [ 1113 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1113 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3231 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3231 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3232 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3232 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 706234146, 13434902, 3358720, 0, 0 ] } , "name": "/layers.11/mlp/down_proj/Linear", "outputIndexes": [ 3233 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3233 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3234 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3234 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1114 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1108, 1114 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/Add_1_output_0", "outputIndexes": [ 1115 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1115, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/Reshape_output_0", "outputIndexes": [ 1116 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1116 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 723027768, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.12/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1117 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1117 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3235 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3235 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3236 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3236 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 723048248, 3276822, 819200, 0, 0 ] } , "name": "/layers.12/self_attn/q_proj/Linear", "outputIndexes": [ 3237 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3237 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3238 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3238 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1118 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1117 ] , "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_output_0", "outputIndexes": [ 1119 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1119 ] , "main_type": "NONE", "name": "Shape4562", "outputIndexes": [ 1120 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1119 ] , "main_type": "NONE", "name": "Rank4564", "outputIndexes": [ 1121 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1121, 1121 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4566", "outputIndexes": [ 1122 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1122 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4567", "outputIndexes": [ 1123 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1122, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4569", "outputIndexes": [ 1124 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1124 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4570", "outputIndexes": [ 1125 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1120, 1123, 1125, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4573", "outputIndexes": [ 1126 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1126 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4574", "outputIndexes": [ 1127 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1127, 1127 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4576", "outputIndexes": [ 1128 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1119, 1128, 1122 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_output_0", "outputIndexes": [ 1129 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1129, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1130 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1122 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4584", "outputIndexes": [ 1131 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1124 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4587", "outputIndexes": [ 1132 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1120, 1131, 1132, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4590", "outputIndexes": [ 1133 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1133 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4591", "outputIndexes": [ 1134 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1134 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4592", "outputIndexes": [ 1135 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1135, 1134 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4593", "outputIndexes": [ 1136 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1119, 1136, 1122 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_1_output_0", "outputIndexes": [ 1137 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1137, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1138 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1130, 1138, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.12/self_attn/Concat_output_0", "outputIndexes": [ 1139 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1118, 1139 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/self_attn/Reshape_output_0", "outputIndexes": [ 1140 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1140, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_output_0", "outputIndexes": [ 1141 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1140 ] , "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_2_output_0", "outputIndexes": [ 1142 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1142 ] , "main_type": "NONE", "name": "Shape4694", "outputIndexes": [ 1143 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1142 ] , "main_type": "NONE", "name": "Rank4696", "outputIndexes": [ 1144 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1144, 1144 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4698", "outputIndexes": [ 1145 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1145 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4699", "outputIndexes": [ 1146 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1145, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4701", "outputIndexes": [ 1147 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1147 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4702", "outputIndexes": [ 1148 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1143, 1146, 1148, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4705", "outputIndexes": [ 1149 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1149 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4706", "outputIndexes": [ 1150 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1150 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4707", "outputIndexes": [ 1151 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1151, 1150 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4708", "outputIndexes": [ 1152 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1142, 1152, 1145 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_2_output_0", "outputIndexes": [ 1153 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1153, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Div_output_0", "outputIndexes": [ 1154 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1154, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1155 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1140, 1155, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_1_output_0", "outputIndexes": [ 1156 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1156 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.12/self_attn/Neg_output_0", "outputIndexes": [ 1157 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1154, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1158 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1140, 22, 1158, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_output_0", "outputIndexes": [ 1159 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1157, 1159 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.12/self_attn/Concat_3_output_0", "outputIndexes": [ 1160 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1160, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_1_output_0", "outputIndexes": [ 1161 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1141, 1161 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Add_output_0", "outputIndexes": [ 1162 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3236 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 727144270, 655382, 163840, 0, 0 ] } , "name": "/layers.12/self_attn/k_proj/Linear", "outputIndexes": [ 3241 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3241 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3242 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3242 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1163 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1129, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1164 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1137, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1165 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1164, 1165, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.12/self_attn/Concat_1_output_0", "outputIndexes": [ 1166 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1163, 1166 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/self_attn/Reshape_1_output_0", "outputIndexes": [ 1167 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1167, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_2_output_0", "outputIndexes": [ 1168 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1167 ] , "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_3_output_0", "outputIndexes": [ 1169 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1169 ] , "main_type": "NONE", "name": "Shape4600", "outputIndexes": [ 1170 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1169 ] , "main_type": "NONE", "name": "Rank4602", "outputIndexes": [ 1171 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1171, 1171 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4604", "outputIndexes": [ 1172 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1172 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4605", "outputIndexes": [ 1173 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1172, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4607", "outputIndexes": [ 1174 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1174 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4608", "outputIndexes": [ 1175 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1170, 1173, 1175, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4611", "outputIndexes": [ 1176 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1176 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4612", "outputIndexes": [ 1177 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1177 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4613", "outputIndexes": [ 1178 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1178, 1177 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4614", "outputIndexes": [ 1179 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1169, 1179, 1172 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_3_output_0", "outputIndexes": [ 1180 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1180, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Div_1_output_0", "outputIndexes": [ 1181 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1181, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1182 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1167, 1182, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_3_output_0", "outputIndexes": [ 1183 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1183 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.12/self_attn/Neg_1_output_0", "outputIndexes": [ 1184 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1181, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1185 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1167, 22, 1185, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_2_output_0", "outputIndexes": [ 1186 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1184, 1186 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.12/self_attn/Concat_4_output_0", "outputIndexes": [ 1187 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1187, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_3_output_0", "outputIndexes": [ 1188 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1168, 1188 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Add_1_output_0", "outputIndexes": [ 1189 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3236 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 727963492, 655382, 163840, 0, 0 ] } , "name": "/layers.12/self_attn/v_proj/Linear", "outputIndexes": [ 3245 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3245 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3246 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3246 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1190 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1129, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1191 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1137, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1192 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1191, 1192, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.12/self_attn/Concat_2_output_0", "outputIndexes": [ 1193 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1190, 1193 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/self_attn/Reshape_2_output_0", "outputIndexes": [ 1194 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1162, 1189, 1194, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.12/self_attn/Reshape_7_output_0", "outputIndexes": [ 1195 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1195 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3247 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3247 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3248 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3248 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 728782714, 3276822, 819200, 0, 0 ] } , "name": "/layers.12/self_attn/o_proj/Linear", "outputIndexes": [ 3249 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3249 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3250 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3250 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1196 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1116, 1196 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/Add_output_0", "outputIndexes": [ 1197 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1197 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 732878736, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.12/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1198 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1198 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3251 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3251 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3252 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3252 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 732899216, 13434902, 3358720, 0, 0 ] } , "name": "/layers.12/mlp/gate_proj/Linear", "outputIndexes": [ 3253 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3253 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3254 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3254 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1199 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1199 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.12/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1200 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3252 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 749692838, 13434902, 3358720, 0, 0 ] } , "name": "/layers.12/mlp/up_proj/Linear", "outputIndexes": [ 3257 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3257 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3258 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3258 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1201 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1200, 1201 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/mlp/Mul_output_0", "outputIndexes": [ 1202 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1202 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3259 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3259 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3260 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3260 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 766486460, 13434902, 3358720, 0, 0 ] } , "name": "/layers.12/mlp/down_proj/Linear", "outputIndexes": [ 3261 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3261 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3262 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3262 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1203 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1197, 1203 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/Add_1_output_0", "outputIndexes": [ 1204 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1204, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/Reshape_output_0", "outputIndexes": [ 1205 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1205 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 783280082, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.13/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1206 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1206 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3263 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3263 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3264 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3264 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 783300562, 3276822, 819200, 0, 0 ] } , "name": "/layers.13/self_attn/q_proj/Linear", "outputIndexes": [ 3265 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3265 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3266 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3266 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1207 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1206 ] , "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_output_0", "outputIndexes": [ 1208 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1208 ] , "main_type": "NONE", "name": "Shape4933", "outputIndexes": [ 1209 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1208 ] , "main_type": "NONE", "name": "Rank4935", "outputIndexes": [ 1210 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1210, 1210 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4937", "outputIndexes": [ 1211 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1211 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4938", "outputIndexes": [ 1212 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1211, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4940", "outputIndexes": [ 1213 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1213 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4941", "outputIndexes": [ 1214 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1209, 1212, 1214, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4944", "outputIndexes": [ 1215 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1215 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4945", "outputIndexes": [ 1216 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1216, 1216 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4947", "outputIndexes": [ 1217 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1208, 1217, 1211 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_output_0", "outputIndexes": [ 1218 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1218, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1219 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1211 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4955", "outputIndexes": [ 1220 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1213 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4958", "outputIndexes": [ 1221 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1209, 1220, 1221, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4961", "outputIndexes": [ 1222 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1222 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4962", "outputIndexes": [ 1223 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1223 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4963", "outputIndexes": [ 1224 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1224, 1223 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4964", "outputIndexes": [ 1225 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1208, 1225, 1211 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_1_output_0", "outputIndexes": [ 1226 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1226, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1227 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1219, 1227, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.13/self_attn/Concat_output_0", "outputIndexes": [ 1228 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1207, 1228 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/self_attn/Reshape_output_0", "outputIndexes": [ 1229 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1229, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_output_0", "outputIndexes": [ 1230 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1229 ] , "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_2_output_0", "outputIndexes": [ 1231 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1231 ] , "main_type": "NONE", "name": "Shape5065", "outputIndexes": [ 1232 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1231 ] , "main_type": "NONE", "name": "Rank5067", "outputIndexes": [ 1233 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1233, 1233 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5069", "outputIndexes": [ 1234 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1234 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5070", "outputIndexes": [ 1235 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1234, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5072", "outputIndexes": [ 1236 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1236 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5073", "outputIndexes": [ 1237 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1232, 1235, 1237, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5076", "outputIndexes": [ 1238 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1238 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5077", "outputIndexes": [ 1239 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1239 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5078", "outputIndexes": [ 1240 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1240, 1239 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5079", "outputIndexes": [ 1241 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1231, 1241, 1234 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_2_output_0", "outputIndexes": [ 1242 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1242, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Div_output_0", "outputIndexes": [ 1243 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1243, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1244 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1229, 1244, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_1_output_0", "outputIndexes": [ 1245 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1245 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.13/self_attn/Neg_output_0", "outputIndexes": [ 1246 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1243, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1247 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1229, 22, 1247, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_output_0", "outputIndexes": [ 1248 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1246, 1248 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.13/self_attn/Concat_3_output_0", "outputIndexes": [ 1249 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1249, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_1_output_0", "outputIndexes": [ 1250 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1230, 1250 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Add_output_0", "outputIndexes": [ 1251 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3264 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 787396584, 655382, 163840, 0, 0 ] } , "name": "/layers.13/self_attn/k_proj/Linear", "outputIndexes": [ 3269 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3269 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3270 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3270 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1252 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1218, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1253 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1226, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1254 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1253, 1254, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.13/self_attn/Concat_1_output_0", "outputIndexes": [ 1255 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1252, 1255 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/self_attn/Reshape_1_output_0", "outputIndexes": [ 1256 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1256, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_2_output_0", "outputIndexes": [ 1257 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1256 ] , "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_3_output_0", "outputIndexes": [ 1258 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1258 ] , "main_type": "NONE", "name": "Shape4971", "outputIndexes": [ 1259 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1258 ] , "main_type": "NONE", "name": "Rank4973", "outputIndexes": [ 1260 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1260, 1260 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4975", "outputIndexes": [ 1261 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1261 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4976", "outputIndexes": [ 1262 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1261, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4978", "outputIndexes": [ 1263 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1263 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4979", "outputIndexes": [ 1264 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1259, 1262, 1264, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4982", "outputIndexes": [ 1265 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1265 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4983", "outputIndexes": [ 1266 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1266 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4984", "outputIndexes": [ 1267 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1267, 1266 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4985", "outputIndexes": [ 1268 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1258, 1268, 1261 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_3_output_0", "outputIndexes": [ 1269 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1269, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Div_1_output_0", "outputIndexes": [ 1270 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1270, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1271 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1256, 1271, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_3_output_0", "outputIndexes": [ 1272 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1272 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.13/self_attn/Neg_1_output_0", "outputIndexes": [ 1273 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1270, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1274 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1256, 22, 1274, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_2_output_0", "outputIndexes": [ 1275 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1273, 1275 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.13/self_attn/Concat_4_output_0", "outputIndexes": [ 1276 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1276, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_3_output_0", "outputIndexes": [ 1277 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1257, 1277 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Add_1_output_0", "outputIndexes": [ 1278 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3264 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 788215806, 655382, 163840, 0, 0 ] } , "name": "/layers.13/self_attn/v_proj/Linear", "outputIndexes": [ 3273 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3273 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3274 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3274 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1279 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1218, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1280 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1226, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1281 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1280, 1281, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.13/self_attn/Concat_2_output_0", "outputIndexes": [ 1282 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1279, 1282 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/self_attn/Reshape_2_output_0", "outputIndexes": [ 1283 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1251, 1278, 1283, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.13/self_attn/Reshape_7_output_0", "outputIndexes": [ 1284 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1284 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3275 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3275 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3276 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3276 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 789035028, 3276822, 819200, 0, 0 ] } , "name": "/layers.13/self_attn/o_proj/Linear", "outputIndexes": [ 3277 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3277 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3278 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3278 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1285 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1205, 1285 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/Add_output_0", "outputIndexes": [ 1286 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1286 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 793131050, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.13/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1287 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1287 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3279 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3279 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3280 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3280 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 793151530, 13434902, 3358720, 0, 0 ] } , "name": "/layers.13/mlp/gate_proj/Linear", "outputIndexes": [ 3281 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3281 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3282 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3282 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1288 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1288 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.13/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1289 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3280 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 809945152, 13434902, 3358720, 0, 0 ] } , "name": "/layers.13/mlp/up_proj/Linear", "outputIndexes": [ 3285 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3285 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3286 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3286 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1290 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1289, 1290 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/mlp/Mul_output_0", "outputIndexes": [ 1291 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1291 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3287 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3287 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3288 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3288 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 826738774, 13434902, 3358720, 0, 0 ] } , "name": "/layers.13/mlp/down_proj/Linear", "outputIndexes": [ 3289 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3289 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3290 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3290 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1292 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1286, 1292 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/Add_1_output_0", "outputIndexes": [ 1293 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1293, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/Reshape_output_0", "outputIndexes": [ 1294 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1294 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 843532396, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.14/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1295 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1295 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3291 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3291 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3292 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3292 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 843552876, 3276822, 819200, 0, 0 ] } , "name": "/layers.14/self_attn/q_proj/Linear", "outputIndexes": [ 3293 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3293 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3294 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3294 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1296 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1295 ] , "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_output_0", "outputIndexes": [ 1297 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1297 ] , "main_type": "NONE", "name": "Shape5304", "outputIndexes": [ 1298 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1297 ] , "main_type": "NONE", "name": "Rank5306", "outputIndexes": [ 1299 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1299, 1299 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5308", "outputIndexes": [ 1300 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1300 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5309", "outputIndexes": [ 1301 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1300, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5311", "outputIndexes": [ 1302 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1302 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5312", "outputIndexes": [ 1303 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1298, 1301, 1303, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5315", "outputIndexes": [ 1304 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1304 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5316", "outputIndexes": [ 1305 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1305, 1305 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5318", "outputIndexes": [ 1306 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1297, 1306, 1300 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_output_0", "outputIndexes": [ 1307 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1307, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1308 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1300 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5326", "outputIndexes": [ 1309 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1302 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5329", "outputIndexes": [ 1310 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1298, 1309, 1310, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5332", "outputIndexes": [ 1311 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1311 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5333", "outputIndexes": [ 1312 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1312 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5334", "outputIndexes": [ 1313 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1313, 1312 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5335", "outputIndexes": [ 1314 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1297, 1314, 1300 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_1_output_0", "outputIndexes": [ 1315 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1315, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1316 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1308, 1316, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.14/self_attn/Concat_output_0", "outputIndexes": [ 1317 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1296, 1317 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/self_attn/Reshape_output_0", "outputIndexes": [ 1318 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1318, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_output_0", "outputIndexes": [ 1319 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1318 ] , "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_2_output_0", "outputIndexes": [ 1320 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1320 ] , "main_type": "NONE", "name": "Shape5436", "outputIndexes": [ 1321 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1320 ] , "main_type": "NONE", "name": "Rank5438", "outputIndexes": [ 1322 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1322, 1322 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5440", "outputIndexes": [ 1323 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1323 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5441", "outputIndexes": [ 1324 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1323, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5443", "outputIndexes": [ 1325 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1325 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5444", "outputIndexes": [ 1326 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1321, 1324, 1326, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5447", "outputIndexes": [ 1327 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1327 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5448", "outputIndexes": [ 1328 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1328 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5449", "outputIndexes": [ 1329 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1329, 1328 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5450", "outputIndexes": [ 1330 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1320, 1330, 1323 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_2_output_0", "outputIndexes": [ 1331 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1331, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Div_output_0", "outputIndexes": [ 1332 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1332, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1333 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1318, 1333, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_1_output_0", "outputIndexes": [ 1334 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1334 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.14/self_attn/Neg_output_0", "outputIndexes": [ 1335 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1332, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1336 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1318, 22, 1336, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_output_0", "outputIndexes": [ 1337 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1335, 1337 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.14/self_attn/Concat_3_output_0", "outputIndexes": [ 1338 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1338, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_1_output_0", "outputIndexes": [ 1339 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1319, 1339 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Add_output_0", "outputIndexes": [ 1340 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3292 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 847648898, 655382, 163840, 0, 0 ] } , "name": "/layers.14/self_attn/k_proj/Linear", "outputIndexes": [ 3297 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3297 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3298 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3298 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1341 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1307, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1342 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1315, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1343 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1342, 1343, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.14/self_attn/Concat_1_output_0", "outputIndexes": [ 1344 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1341, 1344 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/self_attn/Reshape_1_output_0", "outputIndexes": [ 1345 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1345, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_2_output_0", "outputIndexes": [ 1346 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1345 ] , "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_3_output_0", "outputIndexes": [ 1347 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1347 ] , "main_type": "NONE", "name": "Shape5342", "outputIndexes": [ 1348 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1347 ] , "main_type": "NONE", "name": "Rank5344", "outputIndexes": [ 1349 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1349, 1349 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5346", "outputIndexes": [ 1350 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1350 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5347", "outputIndexes": [ 1351 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1350, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5349", "outputIndexes": [ 1352 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1352 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5350", "outputIndexes": [ 1353 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1348, 1351, 1353, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5353", "outputIndexes": [ 1354 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1354 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5354", "outputIndexes": [ 1355 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1355 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5355", "outputIndexes": [ 1356 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1356, 1355 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5356", "outputIndexes": [ 1357 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1347, 1357, 1350 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_3_output_0", "outputIndexes": [ 1358 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1358, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Div_1_output_0", "outputIndexes": [ 1359 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1359, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1360 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1345, 1360, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_3_output_0", "outputIndexes": [ 1361 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1361 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.14/self_attn/Neg_1_output_0", "outputIndexes": [ 1362 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1359, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1363 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1345, 22, 1363, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_2_output_0", "outputIndexes": [ 1364 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1362, 1364 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.14/self_attn/Concat_4_output_0", "outputIndexes": [ 1365 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1365, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_3_output_0", "outputIndexes": [ 1366 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1346, 1366 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Add_1_output_0", "outputIndexes": [ 1367 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3292 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 848468120, 655382, 163840, 0, 0 ] } , "name": "/layers.14/self_attn/v_proj/Linear", "outputIndexes": [ 3301 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3301 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3302 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3302 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1368 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1307, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1369 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1315, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1370 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1369, 1370, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.14/self_attn/Concat_2_output_0", "outputIndexes": [ 1371 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1368, 1371 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/self_attn/Reshape_2_output_0", "outputIndexes": [ 1372 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1340, 1367, 1372, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.14/self_attn/Reshape_7_output_0", "outputIndexes": [ 1373 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1373 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3303 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3303 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3304 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3304 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 849287342, 3276822, 819200, 0, 0 ] } , "name": "/layers.14/self_attn/o_proj/Linear", "outputIndexes": [ 3305 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3305 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3306 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3306 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1374 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1294, 1374 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/Add_output_0", "outputIndexes": [ 1375 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1375 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 853383364, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.14/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1376 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1376 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3307 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3307 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3308 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3308 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 853403844, 13434902, 3358720, 0, 0 ] } , "name": "/layers.14/mlp/gate_proj/Linear", "outputIndexes": [ 3309 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3309 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3310 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3310 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1377 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1377 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.14/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1378 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3308 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 870197466, 13434902, 3358720, 0, 0 ] } , "name": "/layers.14/mlp/up_proj/Linear", "outputIndexes": [ 3313 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3313 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3314 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3314 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1379 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1378, 1379 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/mlp/Mul_output_0", "outputIndexes": [ 1380 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1380 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3315 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3315 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3316 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3316 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 886991088, 13434902, 3358720, 0, 0 ] } , "name": "/layers.14/mlp/down_proj/Linear", "outputIndexes": [ 3317 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3317 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3318 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3318 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1381 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1375, 1381 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/Add_1_output_0", "outputIndexes": [ 1382 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1382, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/Reshape_output_0", "outputIndexes": [ 1383 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1383 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 903784710, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.15/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1384 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1384 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3319 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3319 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3320 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3320 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 903805190, 3276822, 819200, 0, 0 ] } , "name": "/layers.15/self_attn/q_proj/Linear", "outputIndexes": [ 3321 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3321 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3322 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3322 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1385 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1384 ] , "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_output_0", "outputIndexes": [ 1386 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1386 ] , "main_type": "NONE", "name": "Shape5675", "outputIndexes": [ 1387 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1386 ] , "main_type": "NONE", "name": "Rank5677", "outputIndexes": [ 1388 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1388, 1388 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5679", "outputIndexes": [ 1389 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1389 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5680", "outputIndexes": [ 1390 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1389, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5682", "outputIndexes": [ 1391 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1391 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5683", "outputIndexes": [ 1392 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1387, 1390, 1392, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5686", "outputIndexes": [ 1393 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1393 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5687", "outputIndexes": [ 1394 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1394, 1394 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5689", "outputIndexes": [ 1395 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1386, 1395, 1389 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_output_0", "outputIndexes": [ 1396 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1396, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1397 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1389 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5697", "outputIndexes": [ 1398 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1391 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5700", "outputIndexes": [ 1399 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1387, 1398, 1399, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5703", "outputIndexes": [ 1400 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1400 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5704", "outputIndexes": [ 1401 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1401 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5705", "outputIndexes": [ 1402 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1402, 1401 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5706", "outputIndexes": [ 1403 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1386, 1403, 1389 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_1_output_0", "outputIndexes": [ 1404 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1404, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1405 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1397, 1405, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.15/self_attn/Concat_output_0", "outputIndexes": [ 1406 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1385, 1406 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/self_attn/Reshape_output_0", "outputIndexes": [ 1407 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1407, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_output_0", "outputIndexes": [ 1408 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1407 ] , "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_2_output_0", "outputIndexes": [ 1409 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1409 ] , "main_type": "NONE", "name": "Shape5807", "outputIndexes": [ 1410 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1409 ] , "main_type": "NONE", "name": "Rank5809", "outputIndexes": [ 1411 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1411, 1411 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5811", "outputIndexes": [ 1412 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1412 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5812", "outputIndexes": [ 1413 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1412, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5814", "outputIndexes": [ 1414 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1414 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5815", "outputIndexes": [ 1415 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1410, 1413, 1415, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5818", "outputIndexes": [ 1416 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1416 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5819", "outputIndexes": [ 1417 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1417 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5820", "outputIndexes": [ 1418 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1418, 1417 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5821", "outputIndexes": [ 1419 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1409, 1419, 1412 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_2_output_0", "outputIndexes": [ 1420 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1420, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Div_output_0", "outputIndexes": [ 1421 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1421, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1422 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1407, 1422, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_1_output_0", "outputIndexes": [ 1423 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1423 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.15/self_attn/Neg_output_0", "outputIndexes": [ 1424 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1421, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1425 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1407, 22, 1425, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_output_0", "outputIndexes": [ 1426 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1424, 1426 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.15/self_attn/Concat_3_output_0", "outputIndexes": [ 1427 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1427, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_1_output_0", "outputIndexes": [ 1428 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1408, 1428 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Add_output_0", "outputIndexes": [ 1429 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3320 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 907901212, 655382, 163840, 0, 0 ] } , "name": "/layers.15/self_attn/k_proj/Linear", "outputIndexes": [ 3325 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3325 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3326 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3326 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1430 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1396, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1431 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1404, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1432 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1431, 1432, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.15/self_attn/Concat_1_output_0", "outputIndexes": [ 1433 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1430, 1433 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/self_attn/Reshape_1_output_0", "outputIndexes": [ 1434 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1434, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_2_output_0", "outputIndexes": [ 1435 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1434 ] , "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_3_output_0", "outputIndexes": [ 1436 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1436 ] , "main_type": "NONE", "name": "Shape5713", "outputIndexes": [ 1437 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1436 ] , "main_type": "NONE", "name": "Rank5715", "outputIndexes": [ 1438 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1438, 1438 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5717", "outputIndexes": [ 1439 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1439 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5718", "outputIndexes": [ 1440 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1439, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5720", "outputIndexes": [ 1441 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1441 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5721", "outputIndexes": [ 1442 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1437, 1440, 1442, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5724", "outputIndexes": [ 1443 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1443 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5725", "outputIndexes": [ 1444 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1444 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5726", "outputIndexes": [ 1445 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1445, 1444 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5727", "outputIndexes": [ 1446 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1436, 1446, 1439 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_3_output_0", "outputIndexes": [ 1447 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1447, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Div_1_output_0", "outputIndexes": [ 1448 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1448, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1449 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1434, 1449, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_3_output_0", "outputIndexes": [ 1450 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1450 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.15/self_attn/Neg_1_output_0", "outputIndexes": [ 1451 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1448, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1452 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1434, 22, 1452, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_2_output_0", "outputIndexes": [ 1453 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1451, 1453 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.15/self_attn/Concat_4_output_0", "outputIndexes": [ 1454 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1454, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_3_output_0", "outputIndexes": [ 1455 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1435, 1455 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Add_1_output_0", "outputIndexes": [ 1456 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3320 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 908720434, 655382, 163840, 0, 0 ] } , "name": "/layers.15/self_attn/v_proj/Linear", "outputIndexes": [ 3329 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3329 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3330 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3330 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1457 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1396, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1458 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1404, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1459 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1458, 1459, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.15/self_attn/Concat_2_output_0", "outputIndexes": [ 1460 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1457, 1460 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/self_attn/Reshape_2_output_0", "outputIndexes": [ 1461 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1429, 1456, 1461, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.15/self_attn/Reshape_7_output_0", "outputIndexes": [ 1462 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1462 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3331 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3331 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3332 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3332 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 909539656, 3276822, 819200, 0, 0 ] } , "name": "/layers.15/self_attn/o_proj/Linear", "outputIndexes": [ 3333 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3333 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3334 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3334 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1463 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1383, 1463 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/Add_output_0", "outputIndexes": [ 1464 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1464 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 913635678, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.15/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1465 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1465 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3335 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3335 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3336 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3336 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 913656158, 13434902, 3358720, 0, 0 ] } , "name": "/layers.15/mlp/gate_proj/Linear", "outputIndexes": [ 3337 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3337 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3338 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3338 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1466 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1466 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.15/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1467 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3336 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 930449780, 13434902, 3358720, 0, 0 ] } , "name": "/layers.15/mlp/up_proj/Linear", "outputIndexes": [ 3341 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3341 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3342 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3342 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1468 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1467, 1468 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/mlp/Mul_output_0", "outputIndexes": [ 1469 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1469 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3343 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3343 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3344 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3344 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 947243402, 13434902, 3358720, 0, 0 ] } , "name": "/layers.15/mlp/down_proj/Linear", "outputIndexes": [ 3345 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3345 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3346 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3346 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1470 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1464, 1470 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/Add_1_output_0", "outputIndexes": [ 1471 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1471, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/Reshape_output_0", "outputIndexes": [ 1472 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1472 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 964037024, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.16/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1473 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1473 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3347 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3347 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3348 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3348 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 964057504, 3276822, 819200, 0, 0 ] } , "name": "/layers.16/self_attn/q_proj/Linear", "outputIndexes": [ 3349 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3349 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3350 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3350 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1474 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1473 ] , "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_output_0", "outputIndexes": [ 1475 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1475 ] , "main_type": "NONE", "name": "Shape6046", "outputIndexes": [ 1476 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1475 ] , "main_type": "NONE", "name": "Rank6048", "outputIndexes": [ 1477 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1477, 1477 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6050", "outputIndexes": [ 1478 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1478 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6051", "outputIndexes": [ 1479 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1478, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6053", "outputIndexes": [ 1480 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1480 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6054", "outputIndexes": [ 1481 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1476, 1479, 1481, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6057", "outputIndexes": [ 1482 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1482 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6058", "outputIndexes": [ 1483 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1483, 1483 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6060", "outputIndexes": [ 1484 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1475, 1484, 1478 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_output_0", "outputIndexes": [ 1485 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1485, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1486 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1478 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6068", "outputIndexes": [ 1487 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1480 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6071", "outputIndexes": [ 1488 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1476, 1487, 1488, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6074", "outputIndexes": [ 1489 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1489 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6075", "outputIndexes": [ 1490 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1490 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6076", "outputIndexes": [ 1491 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1491, 1490 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6077", "outputIndexes": [ 1492 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1475, 1492, 1478 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_1_output_0", "outputIndexes": [ 1493 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1493, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1494 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1486, 1494, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.16/self_attn/Concat_output_0", "outputIndexes": [ 1495 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1474, 1495 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/self_attn/Reshape_output_0", "outputIndexes": [ 1496 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1496, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_output_0", "outputIndexes": [ 1497 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1496 ] , "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_2_output_0", "outputIndexes": [ 1498 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1498 ] , "main_type": "NONE", "name": "Shape6178", "outputIndexes": [ 1499 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1498 ] , "main_type": "NONE", "name": "Rank6180", "outputIndexes": [ 1500 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1500, 1500 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6182", "outputIndexes": [ 1501 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1501 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6183", "outputIndexes": [ 1502 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1501, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6185", "outputIndexes": [ 1503 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1503 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6186", "outputIndexes": [ 1504 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1499, 1502, 1504, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6189", "outputIndexes": [ 1505 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1505 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6190", "outputIndexes": [ 1506 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1506 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6191", "outputIndexes": [ 1507 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1507, 1506 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6192", "outputIndexes": [ 1508 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1498, 1508, 1501 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_2_output_0", "outputIndexes": [ 1509 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1509, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Div_output_0", "outputIndexes": [ 1510 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1510, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1511 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1496, 1511, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_1_output_0", "outputIndexes": [ 1512 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1512 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.16/self_attn/Neg_output_0", "outputIndexes": [ 1513 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1510, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1514 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1496, 22, 1514, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_output_0", "outputIndexes": [ 1515 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1513, 1515 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.16/self_attn/Concat_3_output_0", "outputIndexes": [ 1516 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1516, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_1_output_0", "outputIndexes": [ 1517 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1497, 1517 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Add_output_0", "outputIndexes": [ 1518 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3348 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 968153526, 655382, 163840, 0, 0 ] } , "name": "/layers.16/self_attn/k_proj/Linear", "outputIndexes": [ 3353 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3353 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3354 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3354 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1519 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1485, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1520 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1493, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1521 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1520, 1521, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.16/self_attn/Concat_1_output_0", "outputIndexes": [ 1522 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1519, 1522 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/self_attn/Reshape_1_output_0", "outputIndexes": [ 1523 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1523, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_2_output_0", "outputIndexes": [ 1524 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1523 ] , "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_3_output_0", "outputIndexes": [ 1525 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1525 ] , "main_type": "NONE", "name": "Shape6084", "outputIndexes": [ 1526 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1525 ] , "main_type": "NONE", "name": "Rank6086", "outputIndexes": [ 1527 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1527, 1527 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6088", "outputIndexes": [ 1528 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1528 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6089", "outputIndexes": [ 1529 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1528, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6091", "outputIndexes": [ 1530 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1530 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6092", "outputIndexes": [ 1531 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1526, 1529, 1531, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6095", "outputIndexes": [ 1532 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1532 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6096", "outputIndexes": [ 1533 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1533 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6097", "outputIndexes": [ 1534 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1534, 1533 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6098", "outputIndexes": [ 1535 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1525, 1535, 1528 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_3_output_0", "outputIndexes": [ 1536 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1536, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Div_1_output_0", "outputIndexes": [ 1537 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1537, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1538 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1523, 1538, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_3_output_0", "outputIndexes": [ 1539 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1539 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.16/self_attn/Neg_1_output_0", "outputIndexes": [ 1540 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1537, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1541 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1523, 22, 1541, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_2_output_0", "outputIndexes": [ 1542 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1540, 1542 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.16/self_attn/Concat_4_output_0", "outputIndexes": [ 1543 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1543, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_3_output_0", "outputIndexes": [ 1544 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1524, 1544 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Add_1_output_0", "outputIndexes": [ 1545 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3348 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 968972748, 655382, 163840, 0, 0 ] } , "name": "/layers.16/self_attn/v_proj/Linear", "outputIndexes": [ 3357 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3357 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3358 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3358 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1546 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1485, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1547 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1493, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1548 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1547, 1548, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.16/self_attn/Concat_2_output_0", "outputIndexes": [ 1549 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1546, 1549 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/self_attn/Reshape_2_output_0", "outputIndexes": [ 1550 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1518, 1545, 1550, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.16/self_attn/Reshape_7_output_0", "outputIndexes": [ 1551 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1551 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3359 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3359 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3360 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3360 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 969791970, 3276822, 819200, 0, 0 ] } , "name": "/layers.16/self_attn/o_proj/Linear", "outputIndexes": [ 3361 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3361 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3362 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3362 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1552 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1472, 1552 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/Add_output_0", "outputIndexes": [ 1553 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1553 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 973887992, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.16/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1554 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1554 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3363 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3363 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3364 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3364 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 973908472, 13434902, 3358720, 0, 0 ] } , "name": "/layers.16/mlp/gate_proj/Linear", "outputIndexes": [ 3365 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3365 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3366 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3366 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1555 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1555 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.16/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1556 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3364 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 990702094, 13434902, 3358720, 0, 0 ] } , "name": "/layers.16/mlp/up_proj/Linear", "outputIndexes": [ 3369 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3369 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3370 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3370 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1557 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1556, 1557 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/mlp/Mul_output_0", "outputIndexes": [ 1558 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1558 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3371 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3371 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3372 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3372 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1007495716, 13434902, 3358720, 0, 0 ] } , "name": "/layers.16/mlp/down_proj/Linear", "outputIndexes": [ 3373 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3373 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3374 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3374 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1559 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1553, 1559 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/Add_1_output_0", "outputIndexes": [ 1560 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1560, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/Reshape_output_0", "outputIndexes": [ 1561 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1561 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1024289338, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.17/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1562 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1562 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3375 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3375 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3376 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3376 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1024309818, 3276822, 819200, 0, 0 ] } , "name": "/layers.17/self_attn/q_proj/Linear", "outputIndexes": [ 3377 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3377 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3378 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3378 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1563 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1562 ] , "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_output_0", "outputIndexes": [ 1564 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1564 ] , "main_type": "NONE", "name": "Shape6417", "outputIndexes": [ 1565 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1564 ] , "main_type": "NONE", "name": "Rank6419", "outputIndexes": [ 1566 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1566, 1566 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6421", "outputIndexes": [ 1567 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1567 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6422", "outputIndexes": [ 1568 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1567, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6424", "outputIndexes": [ 1569 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1569 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6425", "outputIndexes": [ 1570 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1565, 1568, 1570, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6428", "outputIndexes": [ 1571 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1571 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6429", "outputIndexes": [ 1572 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1572, 1572 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6431", "outputIndexes": [ 1573 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1564, 1573, 1567 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_output_0", "outputIndexes": [ 1574 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1574, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1575 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1567 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6439", "outputIndexes": [ 1576 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1569 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6442", "outputIndexes": [ 1577 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1565, 1576, 1577, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6445", "outputIndexes": [ 1578 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1578 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6446", "outputIndexes": [ 1579 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1579 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6447", "outputIndexes": [ 1580 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1580, 1579 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6448", "outputIndexes": [ 1581 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1564, 1581, 1567 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_1_output_0", "outputIndexes": [ 1582 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1582, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1583 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1575, 1583, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.17/self_attn/Concat_output_0", "outputIndexes": [ 1584 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1563, 1584 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/self_attn/Reshape_output_0", "outputIndexes": [ 1585 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1585, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_output_0", "outputIndexes": [ 1586 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1585 ] , "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_2_output_0", "outputIndexes": [ 1587 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1587 ] , "main_type": "NONE", "name": "Shape6549", "outputIndexes": [ 1588 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1587 ] , "main_type": "NONE", "name": "Rank6551", "outputIndexes": [ 1589 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1589, 1589 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6553", "outputIndexes": [ 1590 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1590 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6554", "outputIndexes": [ 1591 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1590, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6556", "outputIndexes": [ 1592 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1592 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6557", "outputIndexes": [ 1593 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1588, 1591, 1593, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6560", "outputIndexes": [ 1594 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1594 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6561", "outputIndexes": [ 1595 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1595 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6562", "outputIndexes": [ 1596 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1596, 1595 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6563", "outputIndexes": [ 1597 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1587, 1597, 1590 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_2_output_0", "outputIndexes": [ 1598 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1598, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Div_output_0", "outputIndexes": [ 1599 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1599, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1600 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1585, 1600, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_1_output_0", "outputIndexes": [ 1601 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1601 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.17/self_attn/Neg_output_0", "outputIndexes": [ 1602 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1599, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1603 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1585, 22, 1603, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_output_0", "outputIndexes": [ 1604 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1602, 1604 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.17/self_attn/Concat_3_output_0", "outputIndexes": [ 1605 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1605, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_1_output_0", "outputIndexes": [ 1606 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1586, 1606 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Add_output_0", "outputIndexes": [ 1607 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3376 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1028405840, 655382, 163840, 0, 0 ] } , "name": "/layers.17/self_attn/k_proj/Linear", "outputIndexes": [ 3381 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3381 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3382 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3382 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1608 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1574, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1609 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1582, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1610 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1609, 1610, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.17/self_attn/Concat_1_output_0", "outputIndexes": [ 1611 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1608, 1611 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/self_attn/Reshape_1_output_0", "outputIndexes": [ 1612 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1612, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_2_output_0", "outputIndexes": [ 1613 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1612 ] , "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_3_output_0", "outputIndexes": [ 1614 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1614 ] , "main_type": "NONE", "name": "Shape6455", "outputIndexes": [ 1615 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1614 ] , "main_type": "NONE", "name": "Rank6457", "outputIndexes": [ 1616 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1616, 1616 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6459", "outputIndexes": [ 1617 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1617 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6460", "outputIndexes": [ 1618 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1617, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6462", "outputIndexes": [ 1619 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1619 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6463", "outputIndexes": [ 1620 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1615, 1618, 1620, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6466", "outputIndexes": [ 1621 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1621 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6467", "outputIndexes": [ 1622 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1622 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6468", "outputIndexes": [ 1623 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1623, 1622 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6469", "outputIndexes": [ 1624 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1614, 1624, 1617 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_3_output_0", "outputIndexes": [ 1625 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1625, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Div_1_output_0", "outputIndexes": [ 1626 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1626, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1627 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1612, 1627, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_3_output_0", "outputIndexes": [ 1628 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1628 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.17/self_attn/Neg_1_output_0", "outputIndexes": [ 1629 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1626, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1630 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1612, 22, 1630, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_2_output_0", "outputIndexes": [ 1631 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1629, 1631 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.17/self_attn/Concat_4_output_0", "outputIndexes": [ 1632 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1632, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_3_output_0", "outputIndexes": [ 1633 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1613, 1633 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Add_1_output_0", "outputIndexes": [ 1634 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3376 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1029225062, 655382, 163840, 0, 0 ] } , "name": "/layers.17/self_attn/v_proj/Linear", "outputIndexes": [ 3385 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3385 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3386 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3386 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1635 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1574, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1636 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1582, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1637 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1636, 1637, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.17/self_attn/Concat_2_output_0", "outputIndexes": [ 1638 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1635, 1638 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/self_attn/Reshape_2_output_0", "outputIndexes": [ 1639 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1607, 1634, 1639, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.17/self_attn/Reshape_7_output_0", "outputIndexes": [ 1640 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1640 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3387 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3387 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3388 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3388 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1030044284, 3276822, 819200, 0, 0 ] } , "name": "/layers.17/self_attn/o_proj/Linear", "outputIndexes": [ 3389 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3389 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3390 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3390 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1641 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1561, 1641 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/Add_output_0", "outputIndexes": [ 1642 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1642 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1034140306, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.17/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1643 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1643 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3391 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3391 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3392 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3392 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1034160786, 13434902, 3358720, 0, 0 ] } , "name": "/layers.17/mlp/gate_proj/Linear", "outputIndexes": [ 3393 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3393 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3394 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3394 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1644 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1644 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.17/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1645 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3392 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1050954408, 13434902, 3358720, 0, 0 ] } , "name": "/layers.17/mlp/up_proj/Linear", "outputIndexes": [ 3397 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3397 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3398 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3398 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1646 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1645, 1646 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/mlp/Mul_output_0", "outputIndexes": [ 1647 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1647 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3399 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3399 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3400 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3400 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1067748030, 13434902, 3358720, 0, 0 ] } , "name": "/layers.17/mlp/down_proj/Linear", "outputIndexes": [ 3401 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3401 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3402 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3402 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1648 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1642, 1648 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/Add_1_output_0", "outputIndexes": [ 1649 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1649, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/Reshape_output_0", "outputIndexes": [ 1650 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1650 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1084541652, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.18/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1651 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1651 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3403 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3403 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3404 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3404 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1084562132, 3276822, 819200, 0, 0 ] } , "name": "/layers.18/self_attn/q_proj/Linear", "outputIndexes": [ 3405 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3405 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3406 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3406 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1652 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1651 ] , "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_output_0", "outputIndexes": [ 1653 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1653 ] , "main_type": "NONE", "name": "Shape6788", "outputIndexes": [ 1654 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1653 ] , "main_type": "NONE", "name": "Rank6790", "outputIndexes": [ 1655 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1655, 1655 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6792", "outputIndexes": [ 1656 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1656 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6793", "outputIndexes": [ 1657 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1656, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6795", "outputIndexes": [ 1658 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1658 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6796", "outputIndexes": [ 1659 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1654, 1657, 1659, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6799", "outputIndexes": [ 1660 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1660 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6800", "outputIndexes": [ 1661 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1661, 1661 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6802", "outputIndexes": [ 1662 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653, 1662, 1656 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_output_0", "outputIndexes": [ 1663 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1663, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1664 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1656 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6810", "outputIndexes": [ 1665 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1658 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6813", "outputIndexes": [ 1666 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1654, 1665, 1666, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6816", "outputIndexes": [ 1667 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1667 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6817", "outputIndexes": [ 1668 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1668 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6818", "outputIndexes": [ 1669 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1669, 1668 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6819", "outputIndexes": [ 1670 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653, 1670, 1656 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_1_output_0", "outputIndexes": [ 1671 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1671, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1672 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1664, 1672, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.18/self_attn/Concat_output_0", "outputIndexes": [ 1673 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1652, 1673 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/self_attn/Reshape_output_0", "outputIndexes": [ 1674 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1674, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_output_0", "outputIndexes": [ 1675 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1674 ] , "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_2_output_0", "outputIndexes": [ 1676 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1676 ] , "main_type": "NONE", "name": "Shape6920", "outputIndexes": [ 1677 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1676 ] , "main_type": "NONE", "name": "Rank6922", "outputIndexes": [ 1678 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1678, 1678 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6924", "outputIndexes": [ 1679 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1679 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6925", "outputIndexes": [ 1680 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1679, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6927", "outputIndexes": [ 1681 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1681 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6928", "outputIndexes": [ 1682 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1677, 1680, 1682, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6931", "outputIndexes": [ 1683 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1683 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6932", "outputIndexes": [ 1684 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1684 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6933", "outputIndexes": [ 1685 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1685, 1684 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6934", "outputIndexes": [ 1686 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1676, 1686, 1679 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_2_output_0", "outputIndexes": [ 1687 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1687, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Div_output_0", "outputIndexes": [ 1688 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1688, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1689 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1674, 1689, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_1_output_0", "outputIndexes": [ 1690 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1690 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.18/self_attn/Neg_output_0", "outputIndexes": [ 1691 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1688, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1692 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1674, 22, 1692, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_output_0", "outputIndexes": [ 1693 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1691, 1693 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.18/self_attn/Concat_3_output_0", "outputIndexes": [ 1694 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1694, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_1_output_0", "outputIndexes": [ 1695 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1675, 1695 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Add_output_0", "outputIndexes": [ 1696 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3404 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1088658154, 655382, 163840, 0, 0 ] } , "name": "/layers.18/self_attn/k_proj/Linear", "outputIndexes": [ 3409 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3409 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3410 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3410 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1697 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1663, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1698 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1671, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1699 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1698, 1699, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.18/self_attn/Concat_1_output_0", "outputIndexes": [ 1700 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1697, 1700 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/self_attn/Reshape_1_output_0", "outputIndexes": [ 1701 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1701, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_2_output_0", "outputIndexes": [ 1702 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1701 ] , "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_3_output_0", "outputIndexes": [ 1703 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1703 ] , "main_type": "NONE", "name": "Shape6826", "outputIndexes": [ 1704 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1703 ] , "main_type": "NONE", "name": "Rank6828", "outputIndexes": [ 1705 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1705, 1705 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6830", "outputIndexes": [ 1706 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1706 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6831", "outputIndexes": [ 1707 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1706, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6833", "outputIndexes": [ 1708 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1708 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6834", "outputIndexes": [ 1709 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1704, 1707, 1709, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6837", "outputIndexes": [ 1710 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1710 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6838", "outputIndexes": [ 1711 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1711 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6839", "outputIndexes": [ 1712 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1712, 1711 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6840", "outputIndexes": [ 1713 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1703, 1713, 1706 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_3_output_0", "outputIndexes": [ 1714 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1714, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Div_1_output_0", "outputIndexes": [ 1715 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1715, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1716 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1701, 1716, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_3_output_0", "outputIndexes": [ 1717 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1717 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.18/self_attn/Neg_1_output_0", "outputIndexes": [ 1718 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1715, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1719 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1701, 22, 1719, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_2_output_0", "outputIndexes": [ 1720 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1718, 1720 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.18/self_attn/Concat_4_output_0", "outputIndexes": [ 1721 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1721, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_3_output_0", "outputIndexes": [ 1722 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1702, 1722 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Add_1_output_0", "outputIndexes": [ 1723 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3404 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1089477376, 655382, 163840, 0, 0 ] } , "name": "/layers.18/self_attn/v_proj/Linear", "outputIndexes": [ 3413 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3413 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3414 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3414 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1724 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1663, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1725 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1671, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1726 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1725, 1726, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.18/self_attn/Concat_2_output_0", "outputIndexes": [ 1727 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1724, 1727 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/self_attn/Reshape_2_output_0", "outputIndexes": [ 1728 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1696, 1723, 1728, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.18/self_attn/Reshape_7_output_0", "outputIndexes": [ 1729 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1729 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3415 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3415 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3416 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3416 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1090296598, 3276822, 819200, 0, 0 ] } , "name": "/layers.18/self_attn/o_proj/Linear", "outputIndexes": [ 3417 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3417 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3418 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3418 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1730 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1650, 1730 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/Add_output_0", "outputIndexes": [ 1731 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1731 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1094392620, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.18/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1732 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1732 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3419 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3419 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3420 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3420 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1094413100, 13434902, 3358720, 0, 0 ] } , "name": "/layers.18/mlp/gate_proj/Linear", "outputIndexes": [ 3421 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3421 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3422 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3422 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1733 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1733 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.18/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1734 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3420 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1111206722, 13434902, 3358720, 0, 0 ] } , "name": "/layers.18/mlp/up_proj/Linear", "outputIndexes": [ 3425 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3425 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3426 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3426 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1735 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1734, 1735 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/mlp/Mul_output_0", "outputIndexes": [ 1736 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1736 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3427 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3427 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3428 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3428 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1128000344, 13434902, 3358720, 0, 0 ] } , "name": "/layers.18/mlp/down_proj/Linear", "outputIndexes": [ 3429 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3429 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3430 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3430 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1737 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1731, 1737 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/Add_1_output_0", "outputIndexes": [ 1738 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1738, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/Reshape_output_0", "outputIndexes": [ 1739 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1739 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1144793966, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.19/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1740 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1740 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3431 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3431 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3432 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3432 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1144814446, 3276822, 819200, 0, 0 ] } , "name": "/layers.19/self_attn/q_proj/Linear", "outputIndexes": [ 3433 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3433 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3434 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3434 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1741 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1740 ] , "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_output_0", "outputIndexes": [ 1742 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1742 ] , "main_type": "NONE", "name": "Shape7159", "outputIndexes": [ 1743 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1742 ] , "main_type": "NONE", "name": "Rank7161", "outputIndexes": [ 1744 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1744, 1744 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7163", "outputIndexes": [ 1745 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1745 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7164", "outputIndexes": [ 1746 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1745, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7166", "outputIndexes": [ 1747 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1747 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7167", "outputIndexes": [ 1748 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1743, 1746, 1748, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7170", "outputIndexes": [ 1749 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1749 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7171", "outputIndexes": [ 1750 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1750, 1750 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7173", "outputIndexes": [ 1751 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1742, 1751, 1745 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_output_0", "outputIndexes": [ 1752 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1752, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1753 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1745 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7181", "outputIndexes": [ 1754 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1747 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7184", "outputIndexes": [ 1755 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1743, 1754, 1755, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7187", "outputIndexes": [ 1756 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1756 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7188", "outputIndexes": [ 1757 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1757 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7189", "outputIndexes": [ 1758 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1758, 1757 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7190", "outputIndexes": [ 1759 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1742, 1759, 1745 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_1_output_0", "outputIndexes": [ 1760 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1760, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1761 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1753, 1761, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.19/self_attn/Concat_output_0", "outputIndexes": [ 1762 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741, 1762 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/self_attn/Reshape_output_0", "outputIndexes": [ 1763 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1763, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_output_0", "outputIndexes": [ 1764 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1763 ] , "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_2_output_0", "outputIndexes": [ 1765 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1765 ] , "main_type": "NONE", "name": "Shape7291", "outputIndexes": [ 1766 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1765 ] , "main_type": "NONE", "name": "Rank7293", "outputIndexes": [ 1767 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1767, 1767 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7295", "outputIndexes": [ 1768 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1768 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7296", "outputIndexes": [ 1769 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1768, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7298", "outputIndexes": [ 1770 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1770 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7299", "outputIndexes": [ 1771 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1766, 1769, 1771, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7302", "outputIndexes": [ 1772 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1772 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7303", "outputIndexes": [ 1773 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1773 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7304", "outputIndexes": [ 1774 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1774, 1773 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7305", "outputIndexes": [ 1775 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1765, 1775, 1768 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_2_output_0", "outputIndexes": [ 1776 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1776, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Div_output_0", "outputIndexes": [ 1777 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1777, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1778 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1763, 1778, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_1_output_0", "outputIndexes": [ 1779 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1779 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.19/self_attn/Neg_output_0", "outputIndexes": [ 1780 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1777, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1781 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1763, 22, 1781, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_output_0", "outputIndexes": [ 1782 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1780, 1782 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.19/self_attn/Concat_3_output_0", "outputIndexes": [ 1783 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1783, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_1_output_0", "outputIndexes": [ 1784 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1764, 1784 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Add_output_0", "outputIndexes": [ 1785 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3432 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1148910468, 655382, 163840, 0, 0 ] } , "name": "/layers.19/self_attn/k_proj/Linear", "outputIndexes": [ 3437 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3437 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3438 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3438 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1786 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1752, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1787 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1760, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1788 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1787, 1788, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.19/self_attn/Concat_1_output_0", "outputIndexes": [ 1789 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1786, 1789 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/self_attn/Reshape_1_output_0", "outputIndexes": [ 1790 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1790, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_2_output_0", "outputIndexes": [ 1791 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1790 ] , "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_3_output_0", "outputIndexes": [ 1792 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1792 ] , "main_type": "NONE", "name": "Shape7197", "outputIndexes": [ 1793 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1792 ] , "main_type": "NONE", "name": "Rank7199", "outputIndexes": [ 1794 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1794, 1794 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7201", "outputIndexes": [ 1795 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1795 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7202", "outputIndexes": [ 1796 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1795, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7204", "outputIndexes": [ 1797 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1797 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7205", "outputIndexes": [ 1798 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1793, 1796, 1798, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7208", "outputIndexes": [ 1799 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1799 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7209", "outputIndexes": [ 1800 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1800 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7210", "outputIndexes": [ 1801 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1801, 1800 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7211", "outputIndexes": [ 1802 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1792, 1802, 1795 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_3_output_0", "outputIndexes": [ 1803 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1803, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Div_1_output_0", "outputIndexes": [ 1804 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1804, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1805 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1790, 1805, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_3_output_0", "outputIndexes": [ 1806 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1806 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.19/self_attn/Neg_1_output_0", "outputIndexes": [ 1807 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1804, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1808 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1790, 22, 1808, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_2_output_0", "outputIndexes": [ 1809 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1807, 1809 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.19/self_attn/Concat_4_output_0", "outputIndexes": [ 1810 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1810, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_3_output_0", "outputIndexes": [ 1811 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1791, 1811 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Add_1_output_0", "outputIndexes": [ 1812 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3432 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1149729690, 655382, 163840, 0, 0 ] } , "name": "/layers.19/self_attn/v_proj/Linear", "outputIndexes": [ 3441 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3441 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3442 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3442 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1813 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1752, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1814 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1760, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1815 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1814, 1815, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.19/self_attn/Concat_2_output_0", "outputIndexes": [ 1816 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1813, 1816 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/self_attn/Reshape_2_output_0", "outputIndexes": [ 1817 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1785, 1812, 1817, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.19/self_attn/Reshape_7_output_0", "outputIndexes": [ 1818 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1818 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3443 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3443 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3444 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3444 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1150548912, 3276822, 819200, 0, 0 ] } , "name": "/layers.19/self_attn/o_proj/Linear", "outputIndexes": [ 3445 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3445 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3446 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3446 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1819 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1739, 1819 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/Add_output_0", "outputIndexes": [ 1820 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1820 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1154644934, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.19/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1821 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1821 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3447 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3447 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3448 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3448 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1154665414, 13434902, 3358720, 0, 0 ] } , "name": "/layers.19/mlp/gate_proj/Linear", "outputIndexes": [ 3449 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3449 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3450 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3450 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1822 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1822 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.19/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1823 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3448 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1171459036, 13434902, 3358720, 0, 0 ] } , "name": "/layers.19/mlp/up_proj/Linear", "outputIndexes": [ 3453 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3453 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3454 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3454 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1824 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1823, 1824 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/mlp/Mul_output_0", "outputIndexes": [ 1825 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1825 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3455 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3455 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3456 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3456 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1188252658, 13434902, 3358720, 0, 0 ] } , "name": "/layers.19/mlp/down_proj/Linear", "outputIndexes": [ 3457 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3457 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3458 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3458 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1826 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1820, 1826 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/Add_1_output_0", "outputIndexes": [ 1827 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1827, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/Reshape_output_0", "outputIndexes": [ 1828 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1828 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1205046280, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.20/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1829 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1829 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3459 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3459 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3460 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3460 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1205066760, 3276822, 819200, 0, 0 ] } , "name": "/layers.20/self_attn/q_proj/Linear", "outputIndexes": [ 3461 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3461 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3462 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3462 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1830 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1829 ] , "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_output_0", "outputIndexes": [ 1831 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1831 ] , "main_type": "NONE", "name": "Shape7530", "outputIndexes": [ 1832 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1831 ] , "main_type": "NONE", "name": "Rank7532", "outputIndexes": [ 1833 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1833, 1833 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7534", "outputIndexes": [ 1834 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7535", "outputIndexes": [ 1835 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7537", "outputIndexes": [ 1836 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1836 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7538", "outputIndexes": [ 1837 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1832, 1835, 1837, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7541", "outputIndexes": [ 1838 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1838 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7542", "outputIndexes": [ 1839 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839, 1839 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7544", "outputIndexes": [ 1840 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1831, 1840, 1834 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_output_0", "outputIndexes": [ 1841 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1841, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1842 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7552", "outputIndexes": [ 1843 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1836 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7555", "outputIndexes": [ 1844 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1832, 1843, 1844, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7558", "outputIndexes": [ 1845 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1845 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7559", "outputIndexes": [ 1846 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1846 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7560", "outputIndexes": [ 1847 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1847, 1846 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7561", "outputIndexes": [ 1848 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1831, 1848, 1834 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_1_output_0", "outputIndexes": [ 1849 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1849, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1850 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1842, 1850, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.20/self_attn/Concat_output_0", "outputIndexes": [ 1851 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1830, 1851 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/self_attn/Reshape_output_0", "outputIndexes": [ 1852 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1852, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_output_0", "outputIndexes": [ 1853 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1852 ] , "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_2_output_0", "outputIndexes": [ 1854 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1854 ] , "main_type": "NONE", "name": "Shape7662", "outputIndexes": [ 1855 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1854 ] , "main_type": "NONE", "name": "Rank7664", "outputIndexes": [ 1856 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1856, 1856 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7666", "outputIndexes": [ 1857 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1857 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7667", "outputIndexes": [ 1858 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1857, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7669", "outputIndexes": [ 1859 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1859 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7670", "outputIndexes": [ 1860 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1855, 1858, 1860, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7673", "outputIndexes": [ 1861 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1861 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7674", "outputIndexes": [ 1862 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1862 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7675", "outputIndexes": [ 1863 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1863, 1862 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7676", "outputIndexes": [ 1864 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1854, 1864, 1857 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_2_output_0", "outputIndexes": [ 1865 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1865, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Div_output_0", "outputIndexes": [ 1866 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1866, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1867 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1852, 1867, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_1_output_0", "outputIndexes": [ 1868 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1868 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.20/self_attn/Neg_output_0", "outputIndexes": [ 1869 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1866, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1870 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1852, 22, 1870, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_output_0", "outputIndexes": [ 1871 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1869, 1871 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.20/self_attn/Concat_3_output_0", "outputIndexes": [ 1872 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1872, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_1_output_0", "outputIndexes": [ 1873 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1853, 1873 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Add_output_0", "outputIndexes": [ 1874 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3460 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1209162782, 655382, 163840, 0, 0 ] } , "name": "/layers.20/self_attn/k_proj/Linear", "outputIndexes": [ 3465 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3465 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3466 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3466 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1875 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1841, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1876 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1849, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1877 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1876, 1877, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.20/self_attn/Concat_1_output_0", "outputIndexes": [ 1878 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1875, 1878 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/self_attn/Reshape_1_output_0", "outputIndexes": [ 1879 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1879, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_2_output_0", "outputIndexes": [ 1880 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1879 ] , "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_3_output_0", "outputIndexes": [ 1881 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1881 ] , "main_type": "NONE", "name": "Shape7568", "outputIndexes": [ 1882 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1881 ] , "main_type": "NONE", "name": "Rank7570", "outputIndexes": [ 1883 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1883, 1883 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7572", "outputIndexes": [ 1884 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1884 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7573", "outputIndexes": [ 1885 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1884, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7575", "outputIndexes": [ 1886 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1886 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7576", "outputIndexes": [ 1887 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1882, 1885, 1887, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7579", "outputIndexes": [ 1888 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1888 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7580", "outputIndexes": [ 1889 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1889 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7581", "outputIndexes": [ 1890 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1890, 1889 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7582", "outputIndexes": [ 1891 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1881, 1891, 1884 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_3_output_0", "outputIndexes": [ 1892 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1892, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Div_1_output_0", "outputIndexes": [ 1893 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1893, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1894 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1879, 1894, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_3_output_0", "outputIndexes": [ 1895 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1895 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.20/self_attn/Neg_1_output_0", "outputIndexes": [ 1896 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1893, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1897 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1879, 22, 1897, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_2_output_0", "outputIndexes": [ 1898 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1896, 1898 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.20/self_attn/Concat_4_output_0", "outputIndexes": [ 1899 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1899, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_3_output_0", "outputIndexes": [ 1900 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1880, 1900 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Add_1_output_0", "outputIndexes": [ 1901 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3460 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1209982004, 655382, 163840, 0, 0 ] } , "name": "/layers.20/self_attn/v_proj/Linear", "outputIndexes": [ 3469 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3469 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3470 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3470 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1902 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1841, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1903 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1849, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1904 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1903, 1904, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.20/self_attn/Concat_2_output_0", "outputIndexes": [ 1905 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1902, 1905 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/self_attn/Reshape_2_output_0", "outputIndexes": [ 1906 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1874, 1901, 1906, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.20/self_attn/Reshape_7_output_0", "outputIndexes": [ 1907 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1907 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3471 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3471 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3472 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3472 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1210801226, 3276822, 819200, 0, 0 ] } , "name": "/layers.20/self_attn/o_proj/Linear", "outputIndexes": [ 3473 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3473 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3474 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3474 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1908 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1828, 1908 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/Add_output_0", "outputIndexes": [ 1909 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1909 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1214897248, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.20/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1910 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1910 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3475 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3475 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3476 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3476 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1214917728, 13434902, 3358720, 0, 0 ] } , "name": "/layers.20/mlp/gate_proj/Linear", "outputIndexes": [ 3477 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3477 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3478 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3478 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1911 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1911 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.20/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1912 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3476 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1231711350, 13434902, 3358720, 0, 0 ] } , "name": "/layers.20/mlp/up_proj/Linear", "outputIndexes": [ 3481 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3481 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3482 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3482 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1913 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1912, 1913 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/mlp/Mul_output_0", "outputIndexes": [ 1914 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1914 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3483 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3483 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3484 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3484 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1248504972, 13434902, 3358720, 0, 0 ] } , "name": "/layers.20/mlp/down_proj/Linear", "outputIndexes": [ 3485 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3485 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3486 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3486 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1915 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1909, 1915 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/Add_1_output_0", "outputIndexes": [ 1916 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1916, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/Reshape_output_0", "outputIndexes": [ 1917 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1917 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1265298594, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.21/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1918 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1918 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3487 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3487 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3488 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3488 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1265319074, 3276822, 819200, 0, 0 ] } , "name": "/layers.21/self_attn/q_proj/Linear", "outputIndexes": [ 3489 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3489 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3490 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3490 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1919 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1918 ] , "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_output_0", "outputIndexes": [ 1920 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1920 ] , "main_type": "NONE", "name": "Shape7901", "outputIndexes": [ 1921 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1920 ] , "main_type": "NONE", "name": "Rank7903", "outputIndexes": [ 1922 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1922, 1922 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7905", "outputIndexes": [ 1923 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1923 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7906", "outputIndexes": [ 1924 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1923, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7908", "outputIndexes": [ 1925 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1925 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7909", "outputIndexes": [ 1926 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1921, 1924, 1926, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7912", "outputIndexes": [ 1927 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1927 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7913", "outputIndexes": [ 1928 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1928, 1928 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7915", "outputIndexes": [ 1929 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1920, 1929, 1923 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_output_0", "outputIndexes": [ 1930 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1930, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1931 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1923 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7923", "outputIndexes": [ 1932 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1925 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7926", "outputIndexes": [ 1933 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1921, 1932, 1933, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7929", "outputIndexes": [ 1934 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1934 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7930", "outputIndexes": [ 1935 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1935 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7931", "outputIndexes": [ 1936 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1936, 1935 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7932", "outputIndexes": [ 1937 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1920, 1937, 1923 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_1_output_0", "outputIndexes": [ 1938 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1938, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1939 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1931, 1939, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.21/self_attn/Concat_output_0", "outputIndexes": [ 1940 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1919, 1940 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/self_attn/Reshape_output_0", "outputIndexes": [ 1941 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1941, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_output_0", "outputIndexes": [ 1942 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1941 ] , "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_2_output_0", "outputIndexes": [ 1943 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1943 ] , "main_type": "NONE", "name": "Shape8033", "outputIndexes": [ 1944 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1943 ] , "main_type": "NONE", "name": "Rank8035", "outputIndexes": [ 1945 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1945, 1945 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8037", "outputIndexes": [ 1946 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1946 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8038", "outputIndexes": [ 1947 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1946, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8040", "outputIndexes": [ 1948 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1948 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8041", "outputIndexes": [ 1949 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1944, 1947, 1949, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8044", "outputIndexes": [ 1950 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1950 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8045", "outputIndexes": [ 1951 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1951 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8046", "outputIndexes": [ 1952 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1952, 1951 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8047", "outputIndexes": [ 1953 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1943, 1953, 1946 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_2_output_0", "outputIndexes": [ 1954 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1954, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Div_output_0", "outputIndexes": [ 1955 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1955, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1956 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1941, 1956, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_1_output_0", "outputIndexes": [ 1957 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1957 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.21/self_attn/Neg_output_0", "outputIndexes": [ 1958 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1955, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1959 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1941, 22, 1959, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_output_0", "outputIndexes": [ 1960 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1958, 1960 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.21/self_attn/Concat_3_output_0", "outputIndexes": [ 1961 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1961, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_1_output_0", "outputIndexes": [ 1962 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1942, 1962 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Add_output_0", "outputIndexes": [ 1963 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3488 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1269415096, 655382, 163840, 0, 0 ] } , "name": "/layers.21/self_attn/k_proj/Linear", "outputIndexes": [ 3493 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3493 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3494 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3494 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1964 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1930, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1965 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1938, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1966 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1965, 1966, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.21/self_attn/Concat_1_output_0", "outputIndexes": [ 1967 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1964, 1967 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/self_attn/Reshape_1_output_0", "outputIndexes": [ 1968 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1968, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_2_output_0", "outputIndexes": [ 1969 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1968 ] , "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_3_output_0", "outputIndexes": [ 1970 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1970 ] , "main_type": "NONE", "name": "Shape7939", "outputIndexes": [ 1971 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1970 ] , "main_type": "NONE", "name": "Rank7941", "outputIndexes": [ 1972 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1972, 1972 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7943", "outputIndexes": [ 1973 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1973 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7944", "outputIndexes": [ 1974 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1973, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7946", "outputIndexes": [ 1975 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1975 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7947", "outputIndexes": [ 1976 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1971, 1974, 1976, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7950", "outputIndexes": [ 1977 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1977 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7951", "outputIndexes": [ 1978 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1978 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7952", "outputIndexes": [ 1979 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1979, 1978 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7953", "outputIndexes": [ 1980 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1970, 1980, 1973 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_3_output_0", "outputIndexes": [ 1981 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1981, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Div_1_output_0", "outputIndexes": [ 1982 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1982, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1983 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1968, 1983, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_3_output_0", "outputIndexes": [ 1984 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1984 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.21/self_attn/Neg_1_output_0", "outputIndexes": [ 1985 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1982, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1986 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1968, 22, 1986, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_2_output_0", "outputIndexes": [ 1987 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1985, 1987 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.21/self_attn/Concat_4_output_0", "outputIndexes": [ 1988 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1988, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_3_output_0", "outputIndexes": [ 1989 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1969, 1989 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Add_1_output_0", "outputIndexes": [ 1990 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3488 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1270234318, 655382, 163840, 0, 0 ] } , "name": "/layers.21/self_attn/v_proj/Linear", "outputIndexes": [ 3497 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3497 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3498 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3498 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1991 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1930, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1992 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1938, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1993 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1992, 1993, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.21/self_attn/Concat_2_output_0", "outputIndexes": [ 1994 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1991, 1994 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/self_attn/Reshape_2_output_0", "outputIndexes": [ 1995 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1963, 1990, 1995, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.21/self_attn/Reshape_7_output_0", "outputIndexes": [ 1996 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1996 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3499 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3499 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3500 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3500 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1271053540, 3276822, 819200, 0, 0 ] } , "name": "/layers.21/self_attn/o_proj/Linear", "outputIndexes": [ 3501 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3501 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3502 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3502 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1997 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1917, 1997 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/Add_output_0", "outputIndexes": [ 1998 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1998 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1275149562, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.21/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1999 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1999 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3503 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3503 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3504 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3504 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1275170042, 13434902, 3358720, 0, 0 ] } , "name": "/layers.21/mlp/gate_proj/Linear", "outputIndexes": [ 3505 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3505 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3506 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3506 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2000 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2000 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.21/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2001 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3504 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1291963664, 13434902, 3358720, 0, 0 ] } , "name": "/layers.21/mlp/up_proj/Linear", "outputIndexes": [ 3509 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3509 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3510 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3510 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2002 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2001, 2002 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/mlp/Mul_output_0", "outputIndexes": [ 2003 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2003 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3511 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3511 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3512 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3512 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1308757286, 13434902, 3358720, 0, 0 ] } , "name": "/layers.21/mlp/down_proj/Linear", "outputIndexes": [ 3513 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3513 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3514 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3514 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2004 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1998, 2004 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/Add_1_output_0", "outputIndexes": [ 2005 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2005, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/Reshape_output_0", "outputIndexes": [ 2006 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2006 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1325550908, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.22/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2007 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2007 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3515 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3515 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3516 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3516 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1325571388, 3276822, 819200, 0, 0 ] } , "name": "/layers.22/self_attn/q_proj/Linear", "outputIndexes": [ 3517 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3517 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3518 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3518 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2008 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2007 ] , "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_output_0", "outputIndexes": [ 2009 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2009 ] , "main_type": "NONE", "name": "Shape8272", "outputIndexes": [ 2010 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2009 ] , "main_type": "NONE", "name": "Rank8274", "outputIndexes": [ 2011 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2011, 2011 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8276", "outputIndexes": [ 2012 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2012 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8277", "outputIndexes": [ 2013 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2012, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8279", "outputIndexes": [ 2014 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2014 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8280", "outputIndexes": [ 2015 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2010, 2013, 2015, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8283", "outputIndexes": [ 2016 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2016 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8284", "outputIndexes": [ 2017 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2017, 2017 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8286", "outputIndexes": [ 2018 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2009, 2018, 2012 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_output_0", "outputIndexes": [ 2019 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2019, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2020 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2012 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8294", "outputIndexes": [ 2021 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2014 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8297", "outputIndexes": [ 2022 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2010, 2021, 2022, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8300", "outputIndexes": [ 2023 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2023 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8301", "outputIndexes": [ 2024 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2024 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8302", "outputIndexes": [ 2025 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2025, 2024 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8303", "outputIndexes": [ 2026 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2009, 2026, 2012 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_1_output_0", "outputIndexes": [ 2027 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2027, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2028 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2020, 2028, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.22/self_attn/Concat_output_0", "outputIndexes": [ 2029 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2008, 2029 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/self_attn/Reshape_output_0", "outputIndexes": [ 2030 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2030, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_output_0", "outputIndexes": [ 2031 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2030 ] , "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_2_output_0", "outputIndexes": [ 2032 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2032 ] , "main_type": "NONE", "name": "Shape8404", "outputIndexes": [ 2033 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2032 ] , "main_type": "NONE", "name": "Rank8406", "outputIndexes": [ 2034 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2034, 2034 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8408", "outputIndexes": [ 2035 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2035 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8409", "outputIndexes": [ 2036 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2035, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8411", "outputIndexes": [ 2037 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2037 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8412", "outputIndexes": [ 2038 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2033, 2036, 2038, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8415", "outputIndexes": [ 2039 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2039 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8416", "outputIndexes": [ 2040 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2040 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8417", "outputIndexes": [ 2041 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2041, 2040 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8418", "outputIndexes": [ 2042 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2032, 2042, 2035 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_2_output_0", "outputIndexes": [ 2043 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2043, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Div_output_0", "outputIndexes": [ 2044 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2044, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2045 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2030, 2045, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_1_output_0", "outputIndexes": [ 2046 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2046 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.22/self_attn/Neg_output_0", "outputIndexes": [ 2047 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2044, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2048 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2030, 22, 2048, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_output_0", "outputIndexes": [ 2049 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2047, 2049 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.22/self_attn/Concat_3_output_0", "outputIndexes": [ 2050 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2050, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_1_output_0", "outputIndexes": [ 2051 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2031, 2051 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Add_output_0", "outputIndexes": [ 2052 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3516 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1329667410, 655382, 163840, 0, 0 ] } , "name": "/layers.22/self_attn/k_proj/Linear", "outputIndexes": [ 3521 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3521 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3522 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3522 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2053 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2019, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2054 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2027, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2055 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2054, 2055, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.22/self_attn/Concat_1_output_0", "outputIndexes": [ 2056 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2053, 2056 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/self_attn/Reshape_1_output_0", "outputIndexes": [ 2057 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2057, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_2_output_0", "outputIndexes": [ 2058 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2057 ] , "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_3_output_0", "outputIndexes": [ 2059 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2059 ] , "main_type": "NONE", "name": "Shape8310", "outputIndexes": [ 2060 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2059 ] , "main_type": "NONE", "name": "Rank8312", "outputIndexes": [ 2061 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2061, 2061 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8314", "outputIndexes": [ 2062 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2062 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8315", "outputIndexes": [ 2063 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2062, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8317", "outputIndexes": [ 2064 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2064 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8318", "outputIndexes": [ 2065 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2060, 2063, 2065, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8321", "outputIndexes": [ 2066 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2066 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8322", "outputIndexes": [ 2067 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2067 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8323", "outputIndexes": [ 2068 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2068, 2067 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8324", "outputIndexes": [ 2069 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2059, 2069, 2062 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_3_output_0", "outputIndexes": [ 2070 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2070, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Div_1_output_0", "outputIndexes": [ 2071 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2071, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2072 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2057, 2072, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_3_output_0", "outputIndexes": [ 2073 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2073 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.22/self_attn/Neg_1_output_0", "outputIndexes": [ 2074 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2071, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2075 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2057, 22, 2075, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_2_output_0", "outputIndexes": [ 2076 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2074, 2076 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.22/self_attn/Concat_4_output_0", "outputIndexes": [ 2077 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2077, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_3_output_0", "outputIndexes": [ 2078 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2058, 2078 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Add_1_output_0", "outputIndexes": [ 2079 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3516 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1330486632, 655382, 163840, 0, 0 ] } , "name": "/layers.22/self_attn/v_proj/Linear", "outputIndexes": [ 3525 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3525 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3526 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3526 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2080 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2019, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2081 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2027, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2082 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2081, 2082, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.22/self_attn/Concat_2_output_0", "outputIndexes": [ 2083 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2080, 2083 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/self_attn/Reshape_2_output_0", "outputIndexes": [ 2084 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2052, 2079, 2084, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.22/self_attn/Reshape_7_output_0", "outputIndexes": [ 2085 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2085 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3527 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3527 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3528 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3528 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1331305854, 3276822, 819200, 0, 0 ] } , "name": "/layers.22/self_attn/o_proj/Linear", "outputIndexes": [ 3529 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3529 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3530 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3530 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2086 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2006, 2086 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/Add_output_0", "outputIndexes": [ 2087 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2087 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1335401876, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.22/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2088 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2088 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3531 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3531 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3532 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3532 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1335422356, 13434902, 3358720, 0, 0 ] } , "name": "/layers.22/mlp/gate_proj/Linear", "outputIndexes": [ 3533 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3533 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3534 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3534 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2089 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2089 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.22/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2090 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3532 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1352215978, 13434902, 3358720, 0, 0 ] } , "name": "/layers.22/mlp/up_proj/Linear", "outputIndexes": [ 3537 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3537 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3538 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3538 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2091 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2090, 2091 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/mlp/Mul_output_0", "outputIndexes": [ 2092 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2092 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3539 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3539 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3540 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3540 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1369009600, 13434902, 3358720, 0, 0 ] } , "name": "/layers.22/mlp/down_proj/Linear", "outputIndexes": [ 3541 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3541 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3542 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3542 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2093 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2087, 2093 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/Add_1_output_0", "outputIndexes": [ 2094 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2094, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/Reshape_output_0", "outputIndexes": [ 2095 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2095 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1385803222, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.23/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2096 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2096 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3543 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3543 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3544 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3544 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1385823702, 3276822, 819200, 0, 0 ] } , "name": "/layers.23/self_attn/q_proj/Linear", "outputIndexes": [ 3545 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3545 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3546 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3546 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2097 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2096 ] , "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_output_0", "outputIndexes": [ 2098 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2098 ] , "main_type": "NONE", "name": "Shape8643", "outputIndexes": [ 2099 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2098 ] , "main_type": "NONE", "name": "Rank8645", "outputIndexes": [ 2100 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2100, 2100 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8647", "outputIndexes": [ 2101 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2101 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8648", "outputIndexes": [ 2102 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2101, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8650", "outputIndexes": [ 2103 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2103 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8651", "outputIndexes": [ 2104 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2099, 2102, 2104, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8654", "outputIndexes": [ 2105 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2105 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8655", "outputIndexes": [ 2106 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2106, 2106 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8657", "outputIndexes": [ 2107 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2098, 2107, 2101 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_output_0", "outputIndexes": [ 2108 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2108, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2109 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2101 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8665", "outputIndexes": [ 2110 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2103 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8668", "outputIndexes": [ 2111 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2099, 2110, 2111, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8671", "outputIndexes": [ 2112 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2112 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8672", "outputIndexes": [ 2113 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2113 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8673", "outputIndexes": [ 2114 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2114, 2113 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8674", "outputIndexes": [ 2115 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2098, 2115, 2101 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_1_output_0", "outputIndexes": [ 2116 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2116, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2117 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2109, 2117, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.23/self_attn/Concat_output_0", "outputIndexes": [ 2118 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2097, 2118 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/self_attn/Reshape_output_0", "outputIndexes": [ 2119 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2119, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_output_0", "outputIndexes": [ 2120 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2119 ] , "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_2_output_0", "outputIndexes": [ 2121 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2121 ] , "main_type": "NONE", "name": "Shape8775", "outputIndexes": [ 2122 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2121 ] , "main_type": "NONE", "name": "Rank8777", "outputIndexes": [ 2123 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2123, 2123 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8779", "outputIndexes": [ 2124 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2124 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8780", "outputIndexes": [ 2125 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2124, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8782", "outputIndexes": [ 2126 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2126 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8783", "outputIndexes": [ 2127 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2122, 2125, 2127, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8786", "outputIndexes": [ 2128 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2128 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8787", "outputIndexes": [ 2129 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2129 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8788", "outputIndexes": [ 2130 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2130, 2129 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8789", "outputIndexes": [ 2131 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2121, 2131, 2124 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_2_output_0", "outputIndexes": [ 2132 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2132, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Div_output_0", "outputIndexes": [ 2133 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2133, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2134 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2119, 2134, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_1_output_0", "outputIndexes": [ 2135 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2135 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.23/self_attn/Neg_output_0", "outputIndexes": [ 2136 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2133, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2137 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2119, 22, 2137, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_output_0", "outputIndexes": [ 2138 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2136, 2138 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.23/self_attn/Concat_3_output_0", "outputIndexes": [ 2139 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2139, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_1_output_0", "outputIndexes": [ 2140 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2120, 2140 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Add_output_0", "outputIndexes": [ 2141 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3544 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1389919724, 655382, 163840, 0, 0 ] } , "name": "/layers.23/self_attn/k_proj/Linear", "outputIndexes": [ 3549 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3549 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3550 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3550 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2142 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2108, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2143 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2116, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2144 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2143, 2144, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.23/self_attn/Concat_1_output_0", "outputIndexes": [ 2145 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2142, 2145 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/self_attn/Reshape_1_output_0", "outputIndexes": [ 2146 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2146, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_2_output_0", "outputIndexes": [ 2147 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2146 ] , "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_3_output_0", "outputIndexes": [ 2148 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2148 ] , "main_type": "NONE", "name": "Shape8681", "outputIndexes": [ 2149 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2148 ] , "main_type": "NONE", "name": "Rank8683", "outputIndexes": [ 2150 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2150, 2150 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8685", "outputIndexes": [ 2151 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2151 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8686", "outputIndexes": [ 2152 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2151, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8688", "outputIndexes": [ 2153 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2153 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8689", "outputIndexes": [ 2154 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2149, 2152, 2154, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8692", "outputIndexes": [ 2155 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2155 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8693", "outputIndexes": [ 2156 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2156 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8694", "outputIndexes": [ 2157 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2157, 2156 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8695", "outputIndexes": [ 2158 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2148, 2158, 2151 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_3_output_0", "outputIndexes": [ 2159 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2159, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Div_1_output_0", "outputIndexes": [ 2160 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2160, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2161 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2146, 2161, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_3_output_0", "outputIndexes": [ 2162 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2162 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.23/self_attn/Neg_1_output_0", "outputIndexes": [ 2163 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2160, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2164 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2146, 22, 2164, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_2_output_0", "outputIndexes": [ 2165 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2163, 2165 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.23/self_attn/Concat_4_output_0", "outputIndexes": [ 2166 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2166, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_3_output_0", "outputIndexes": [ 2167 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2147, 2167 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Add_1_output_0", "outputIndexes": [ 2168 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3544 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1390738946, 655382, 163840, 0, 0 ] } , "name": "/layers.23/self_attn/v_proj/Linear", "outputIndexes": [ 3553 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3553 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3554 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3554 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2169 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2108, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2170 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2116, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2171 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2170, 2171, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.23/self_attn/Concat_2_output_0", "outputIndexes": [ 2172 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2169, 2172 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/self_attn/Reshape_2_output_0", "outputIndexes": [ 2173 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2141, 2168, 2173, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.23/self_attn/Reshape_7_output_0", "outputIndexes": [ 2174 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2174 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3555 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3555 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3556 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3556 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1391558168, 3276822, 819200, 0, 0 ] } , "name": "/layers.23/self_attn/o_proj/Linear", "outputIndexes": [ 3557 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3557 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3558 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3558 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2175 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2095, 2175 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/Add_output_0", "outputIndexes": [ 2176 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2176 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1395654190, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.23/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2177 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2177 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3559 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3559 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3560 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3560 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1395674670, 13434902, 3358720, 0, 0 ] } , "name": "/layers.23/mlp/gate_proj/Linear", "outputIndexes": [ 3561 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3561 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3562 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3562 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2178 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2178 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.23/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2179 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3560 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1412468292, 13434902, 3358720, 0, 0 ] } , "name": "/layers.23/mlp/up_proj/Linear", "outputIndexes": [ 3565 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3565 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3566 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3566 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2180 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2179, 2180 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/mlp/Mul_output_0", "outputIndexes": [ 2181 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2181 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3567 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3567 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3568 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3568 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1429261914, 13434902, 3358720, 0, 0 ] } , "name": "/layers.23/mlp/down_proj/Linear", "outputIndexes": [ 3569 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3569 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3570 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3570 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2182 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2176, 2182 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/Add_1_output_0", "outputIndexes": [ 2183 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2183, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/Reshape_output_0", "outputIndexes": [ 2184 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2184 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1446055536, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.24/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2185 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2185 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3571 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3571 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3572 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3572 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1446076016, 3276822, 819200, 0, 0 ] } , "name": "/layers.24/self_attn/q_proj/Linear", "outputIndexes": [ 3573 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3573 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3574 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3574 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2186 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2185 ] , "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_output_0", "outputIndexes": [ 2187 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2187 ] , "main_type": "NONE", "name": "Shape9014", "outputIndexes": [ 2188 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2187 ] , "main_type": "NONE", "name": "Rank9016", "outputIndexes": [ 2189 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2189, 2189 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9018", "outputIndexes": [ 2190 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2190 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9019", "outputIndexes": [ 2191 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2190, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9021", "outputIndexes": [ 2192 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2192 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9022", "outputIndexes": [ 2193 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2188, 2191, 2193, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9025", "outputIndexes": [ 2194 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2194 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9026", "outputIndexes": [ 2195 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2195, 2195 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9028", "outputIndexes": [ 2196 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2187, 2196, 2190 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_output_0", "outputIndexes": [ 2197 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2197, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2198 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2190 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9036", "outputIndexes": [ 2199 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2192 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9039", "outputIndexes": [ 2200 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2188, 2199, 2200, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9042", "outputIndexes": [ 2201 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2201 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9043", "outputIndexes": [ 2202 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2202 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9044", "outputIndexes": [ 2203 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2203, 2202 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9045", "outputIndexes": [ 2204 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2187, 2204, 2190 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_1_output_0", "outputIndexes": [ 2205 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2205, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2206 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2198, 2206, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.24/self_attn/Concat_output_0", "outputIndexes": [ 2207 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2186, 2207 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/self_attn/Reshape_output_0", "outputIndexes": [ 2208 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2208, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_output_0", "outputIndexes": [ 2209 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2208 ] , "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_2_output_0", "outputIndexes": [ 2210 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2210 ] , "main_type": "NONE", "name": "Shape9146", "outputIndexes": [ 2211 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2210 ] , "main_type": "NONE", "name": "Rank9148", "outputIndexes": [ 2212 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2212, 2212 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9150", "outputIndexes": [ 2213 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2213 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9151", "outputIndexes": [ 2214 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2213, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9153", "outputIndexes": [ 2215 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2215 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9154", "outputIndexes": [ 2216 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2211, 2214, 2216, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9157", "outputIndexes": [ 2217 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2217 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9158", "outputIndexes": [ 2218 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2218 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9159", "outputIndexes": [ 2219 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2219, 2218 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9160", "outputIndexes": [ 2220 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2210, 2220, 2213 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_2_output_0", "outputIndexes": [ 2221 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2221, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Div_output_0", "outputIndexes": [ 2222 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2222, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2223 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2208, 2223, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_1_output_0", "outputIndexes": [ 2224 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2224 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.24/self_attn/Neg_output_0", "outputIndexes": [ 2225 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2222, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2226 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2208, 22, 2226, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_output_0", "outputIndexes": [ 2227 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2225, 2227 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.24/self_attn/Concat_3_output_0", "outputIndexes": [ 2228 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2228, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_1_output_0", "outputIndexes": [ 2229 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2209, 2229 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Add_output_0", "outputIndexes": [ 2230 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3572 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1450172038, 655382, 163840, 0, 0 ] } , "name": "/layers.24/self_attn/k_proj/Linear", "outputIndexes": [ 3577 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3577 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3578 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3578 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2231 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2197, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2232 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2205, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2233 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2232, 2233, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.24/self_attn/Concat_1_output_0", "outputIndexes": [ 2234 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2231, 2234 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/self_attn/Reshape_1_output_0", "outputIndexes": [ 2235 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2235, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_2_output_0", "outputIndexes": [ 2236 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2235 ] , "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_3_output_0", "outputIndexes": [ 2237 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2237 ] , "main_type": "NONE", "name": "Shape9052", "outputIndexes": [ 2238 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2237 ] , "main_type": "NONE", "name": "Rank9054", "outputIndexes": [ 2239 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2239, 2239 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9056", "outputIndexes": [ 2240 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2240 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9057", "outputIndexes": [ 2241 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2240, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9059", "outputIndexes": [ 2242 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2242 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9060", "outputIndexes": [ 2243 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2238, 2241, 2243, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9063", "outputIndexes": [ 2244 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2244 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9064", "outputIndexes": [ 2245 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2245 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9065", "outputIndexes": [ 2246 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2246, 2245 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9066", "outputIndexes": [ 2247 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2237, 2247, 2240 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_3_output_0", "outputIndexes": [ 2248 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2248, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Div_1_output_0", "outputIndexes": [ 2249 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2249, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2250 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2235, 2250, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_3_output_0", "outputIndexes": [ 2251 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2251 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.24/self_attn/Neg_1_output_0", "outputIndexes": [ 2252 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2249, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2253 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2235, 22, 2253, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_2_output_0", "outputIndexes": [ 2254 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2252, 2254 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.24/self_attn/Concat_4_output_0", "outputIndexes": [ 2255 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2255, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_3_output_0", "outputIndexes": [ 2256 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2236, 2256 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Add_1_output_0", "outputIndexes": [ 2257 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3572 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1450991260, 655382, 163840, 0, 0 ] } , "name": "/layers.24/self_attn/v_proj/Linear", "outputIndexes": [ 3581 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3581 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3582 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3582 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2258 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2197, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2259 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2205, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2260 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2259, 2260, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.24/self_attn/Concat_2_output_0", "outputIndexes": [ 2261 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2258, 2261 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/self_attn/Reshape_2_output_0", "outputIndexes": [ 2262 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2230, 2257, 2262, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.24/self_attn/Reshape_7_output_0", "outputIndexes": [ 2263 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2263 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3583 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3583 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3584 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3584 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1451810482, 3276822, 819200, 0, 0 ] } , "name": "/layers.24/self_attn/o_proj/Linear", "outputIndexes": [ 3585 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3585 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3586 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3586 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2264 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2184, 2264 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/Add_output_0", "outputIndexes": [ 2265 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2265 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1455906504, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.24/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2266 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2266 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3587 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3587 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3588 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3588 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1455926984, 13434902, 3358720, 0, 0 ] } , "name": "/layers.24/mlp/gate_proj/Linear", "outputIndexes": [ 3589 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3589 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3590 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3590 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2267 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2267 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.24/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2268 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3588 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1472720606, 13434902, 3358720, 0, 0 ] } , "name": "/layers.24/mlp/up_proj/Linear", "outputIndexes": [ 3593 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3593 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3594 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3594 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2269 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2268, 2269 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/mlp/Mul_output_0", "outputIndexes": [ 2270 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2270 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3595 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3595 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3596 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3596 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1489514228, 13434902, 3358720, 0, 0 ] } , "name": "/layers.24/mlp/down_proj/Linear", "outputIndexes": [ 3597 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3597 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3598 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3598 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2271 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2265, 2271 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/Add_1_output_0", "outputIndexes": [ 2272 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2272, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/Reshape_output_0", "outputIndexes": [ 2273 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2273 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1506307850, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.25/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2274 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2274 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3599 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3599 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3600 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3600 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1506328330, 3276822, 819200, 0, 0 ] } , "name": "/layers.25/self_attn/q_proj/Linear", "outputIndexes": [ 3601 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3601 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3602 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3602 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2275 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2274 ] , "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_output_0", "outputIndexes": [ 2276 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2276 ] , "main_type": "NONE", "name": "Shape9385", "outputIndexes": [ 2277 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2276 ] , "main_type": "NONE", "name": "Rank9387", "outputIndexes": [ 2278 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2278, 2278 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9389", "outputIndexes": [ 2279 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2279 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9390", "outputIndexes": [ 2280 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2279, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9392", "outputIndexes": [ 2281 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2281 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9393", "outputIndexes": [ 2282 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2277, 2280, 2282, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9396", "outputIndexes": [ 2283 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2283 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9397", "outputIndexes": [ 2284 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2284, 2284 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9399", "outputIndexes": [ 2285 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2276, 2285, 2279 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_output_0", "outputIndexes": [ 2286 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2286, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2287 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2279 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9407", "outputIndexes": [ 2288 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2281 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9410", "outputIndexes": [ 2289 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2277, 2288, 2289, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9413", "outputIndexes": [ 2290 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2290 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9414", "outputIndexes": [ 2291 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2291 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9415", "outputIndexes": [ 2292 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2292, 2291 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9416", "outputIndexes": [ 2293 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2276, 2293, 2279 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_1_output_0", "outputIndexes": [ 2294 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2294, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2295 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2287, 2295, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.25/self_attn/Concat_output_0", "outputIndexes": [ 2296 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2275, 2296 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/self_attn/Reshape_output_0", "outputIndexes": [ 2297 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2297, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_output_0", "outputIndexes": [ 2298 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2297 ] , "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_2_output_0", "outputIndexes": [ 2299 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2299 ] , "main_type": "NONE", "name": "Shape9517", "outputIndexes": [ 2300 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2299 ] , "main_type": "NONE", "name": "Rank9519", "outputIndexes": [ 2301 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2301, 2301 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9521", "outputIndexes": [ 2302 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2302 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9522", "outputIndexes": [ 2303 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2302, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9524", "outputIndexes": [ 2304 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2304 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9525", "outputIndexes": [ 2305 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2300, 2303, 2305, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9528", "outputIndexes": [ 2306 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2306 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9529", "outputIndexes": [ 2307 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2307 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9530", "outputIndexes": [ 2308 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2308, 2307 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9531", "outputIndexes": [ 2309 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2299, 2309, 2302 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_2_output_0", "outputIndexes": [ 2310 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2310, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Div_output_0", "outputIndexes": [ 2311 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2311, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2312 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2297, 2312, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_1_output_0", "outputIndexes": [ 2313 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2313 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.25/self_attn/Neg_output_0", "outputIndexes": [ 2314 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2311, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2315 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2297, 22, 2315, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_output_0", "outputIndexes": [ 2316 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2314, 2316 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.25/self_attn/Concat_3_output_0", "outputIndexes": [ 2317 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2317, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_1_output_0", "outputIndexes": [ 2318 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2298, 2318 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Add_output_0", "outputIndexes": [ 2319 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3600 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1510424352, 655382, 163840, 0, 0 ] } , "name": "/layers.25/self_attn/k_proj/Linear", "outputIndexes": [ 3605 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3605 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3606 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3606 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2320 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2286, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2321 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2294, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2322 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2321, 2322, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.25/self_attn/Concat_1_output_0", "outputIndexes": [ 2323 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2320, 2323 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/self_attn/Reshape_1_output_0", "outputIndexes": [ 2324 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2324, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_2_output_0", "outputIndexes": [ 2325 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2324 ] , "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_3_output_0", "outputIndexes": [ 2326 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2326 ] , "main_type": "NONE", "name": "Shape9423", "outputIndexes": [ 2327 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2326 ] , "main_type": "NONE", "name": "Rank9425", "outputIndexes": [ 2328 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2328, 2328 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9427", "outputIndexes": [ 2329 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2329 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9428", "outputIndexes": [ 2330 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2329, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9430", "outputIndexes": [ 2331 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2331 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9431", "outputIndexes": [ 2332 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2327, 2330, 2332, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9434", "outputIndexes": [ 2333 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2333 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9435", "outputIndexes": [ 2334 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2334 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9436", "outputIndexes": [ 2335 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2335, 2334 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9437", "outputIndexes": [ 2336 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2326, 2336, 2329 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_3_output_0", "outputIndexes": [ 2337 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2337, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Div_1_output_0", "outputIndexes": [ 2338 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2338, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2339 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2324, 2339, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_3_output_0", "outputIndexes": [ 2340 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2340 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.25/self_attn/Neg_1_output_0", "outputIndexes": [ 2341 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2338, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2342 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2324, 22, 2342, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_2_output_0", "outputIndexes": [ 2343 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2341, 2343 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.25/self_attn/Concat_4_output_0", "outputIndexes": [ 2344 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2344, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_3_output_0", "outputIndexes": [ 2345 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2325, 2345 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Add_1_output_0", "outputIndexes": [ 2346 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3600 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1511243574, 655382, 163840, 0, 0 ] } , "name": "/layers.25/self_attn/v_proj/Linear", "outputIndexes": [ 3609 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3609 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3610 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3610 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2347 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2286, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2348 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2294, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2349 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2348, 2349, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.25/self_attn/Concat_2_output_0", "outputIndexes": [ 2350 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2347, 2350 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/self_attn/Reshape_2_output_0", "outputIndexes": [ 2351 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2319, 2346, 2351, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.25/self_attn/Reshape_7_output_0", "outputIndexes": [ 2352 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2352 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3611 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3611 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3612 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3612 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1512062796, 3276822, 819200, 0, 0 ] } , "name": "/layers.25/self_attn/o_proj/Linear", "outputIndexes": [ 3613 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3613 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3614 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3614 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2353 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2273, 2353 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/Add_output_0", "outputIndexes": [ 2354 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2354 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1516158818, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.25/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2355 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2355 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3615 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3615 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3616 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3616 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1516179298, 13434902, 3358720, 0, 0 ] } , "name": "/layers.25/mlp/gate_proj/Linear", "outputIndexes": [ 3617 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3617 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3618 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3618 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2356 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2356 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.25/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2357 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3616 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1532972920, 13434902, 3358720, 0, 0 ] } , "name": "/layers.25/mlp/up_proj/Linear", "outputIndexes": [ 3621 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3621 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3622 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3622 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2358 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2357, 2358 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/mlp/Mul_output_0", "outputIndexes": [ 2359 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2359 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3623 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3623 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3624 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3624 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1549766542, 13434902, 3358720, 0, 0 ] } , "name": "/layers.25/mlp/down_proj/Linear", "outputIndexes": [ 3625 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3625 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3626 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3626 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2360 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2354, 2360 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/Add_1_output_0", "outputIndexes": [ 2361 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2361, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/Reshape_output_0", "outputIndexes": [ 2362 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2362 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1566560164, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.26/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2363 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2363 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3627 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3627 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3628 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3628 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1566580644, 3276822, 819200, 0, 0 ] } , "name": "/layers.26/self_attn/q_proj/Linear", "outputIndexes": [ 3629 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3629 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3630 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3630 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2364 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2363 ] , "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_output_0", "outputIndexes": [ 2365 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2365 ] , "main_type": "NONE", "name": "Shape9756", "outputIndexes": [ 2366 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2365 ] , "main_type": "NONE", "name": "Rank9758", "outputIndexes": [ 2367 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2367, 2367 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9760", "outputIndexes": [ 2368 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2368 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9761", "outputIndexes": [ 2369 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2368, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9763", "outputIndexes": [ 2370 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2370 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9764", "outputIndexes": [ 2371 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2366, 2369, 2371, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9767", "outputIndexes": [ 2372 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2372 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9768", "outputIndexes": [ 2373 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2373, 2373 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9770", "outputIndexes": [ 2374 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2365, 2374, 2368 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_output_0", "outputIndexes": [ 2375 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2375, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2376 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2368 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9778", "outputIndexes": [ 2377 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2370 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9781", "outputIndexes": [ 2378 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2366, 2377, 2378, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9784", "outputIndexes": [ 2379 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2379 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9785", "outputIndexes": [ 2380 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2380 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9786", "outputIndexes": [ 2381 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2381, 2380 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9787", "outputIndexes": [ 2382 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2365, 2382, 2368 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_1_output_0", "outputIndexes": [ 2383 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2383, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2384 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2376, 2384, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.26/self_attn/Concat_output_0", "outputIndexes": [ 2385 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2364, 2385 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/self_attn/Reshape_output_0", "outputIndexes": [ 2386 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2386, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_output_0", "outputIndexes": [ 2387 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2386 ] , "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_2_output_0", "outputIndexes": [ 2388 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2388 ] , "main_type": "NONE", "name": "Shape9888", "outputIndexes": [ 2389 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2388 ] , "main_type": "NONE", "name": "Rank9890", "outputIndexes": [ 2390 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2390, 2390 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9892", "outputIndexes": [ 2391 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2391 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9893", "outputIndexes": [ 2392 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2391, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9895", "outputIndexes": [ 2393 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2393 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9896", "outputIndexes": [ 2394 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2389, 2392, 2394, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9899", "outputIndexes": [ 2395 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2395 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9900", "outputIndexes": [ 2396 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2396 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9901", "outputIndexes": [ 2397 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2397, 2396 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9902", "outputIndexes": [ 2398 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2388, 2398, 2391 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_2_output_0", "outputIndexes": [ 2399 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2399, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Div_output_0", "outputIndexes": [ 2400 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2400, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2401 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2386, 2401, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_1_output_0", "outputIndexes": [ 2402 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2402 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.26/self_attn/Neg_output_0", "outputIndexes": [ 2403 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2400, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2404 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2386, 22, 2404, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_output_0", "outputIndexes": [ 2405 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2403, 2405 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.26/self_attn/Concat_3_output_0", "outputIndexes": [ 2406 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2406, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_1_output_0", "outputIndexes": [ 2407 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2387, 2407 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Add_output_0", "outputIndexes": [ 2408 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3628 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1570676666, 655382, 163840, 0, 0 ] } , "name": "/layers.26/self_attn/k_proj/Linear", "outputIndexes": [ 3633 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3633 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3634 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3634 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2409 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2375, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2410 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2383, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2411 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2410, 2411, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.26/self_attn/Concat_1_output_0", "outputIndexes": [ 2412 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2409, 2412 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/self_attn/Reshape_1_output_0", "outputIndexes": [ 2413 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2413, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_2_output_0", "outputIndexes": [ 2414 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2413 ] , "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_3_output_0", "outputIndexes": [ 2415 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2415 ] , "main_type": "NONE", "name": "Shape9794", "outputIndexes": [ 2416 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2415 ] , "main_type": "NONE", "name": "Rank9796", "outputIndexes": [ 2417 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2417, 2417 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9798", "outputIndexes": [ 2418 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2418 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9799", "outputIndexes": [ 2419 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2418, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9801", "outputIndexes": [ 2420 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2420 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9802", "outputIndexes": [ 2421 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2416, 2419, 2421, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9805", "outputIndexes": [ 2422 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2422 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9806", "outputIndexes": [ 2423 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2423 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9807", "outputIndexes": [ 2424 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2424, 2423 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9808", "outputIndexes": [ 2425 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2415, 2425, 2418 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_3_output_0", "outputIndexes": [ 2426 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2426, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Div_1_output_0", "outputIndexes": [ 2427 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2427, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2428 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2413, 2428, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_3_output_0", "outputIndexes": [ 2429 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2429 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.26/self_attn/Neg_1_output_0", "outputIndexes": [ 2430 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2427, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2431 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2413, 22, 2431, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_2_output_0", "outputIndexes": [ 2432 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2430, 2432 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.26/self_attn/Concat_4_output_0", "outputIndexes": [ 2433 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2433, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_3_output_0", "outputIndexes": [ 2434 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2414, 2434 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Add_1_output_0", "outputIndexes": [ 2435 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3628 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1571495888, 655382, 163840, 0, 0 ] } , "name": "/layers.26/self_attn/v_proj/Linear", "outputIndexes": [ 3637 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3637 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3638 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3638 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2436 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2375, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2437 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2383, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2438 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2437, 2438, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.26/self_attn/Concat_2_output_0", "outputIndexes": [ 2439 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2436, 2439 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/self_attn/Reshape_2_output_0", "outputIndexes": [ 2440 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2408, 2435, 2440, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.26/self_attn/Reshape_7_output_0", "outputIndexes": [ 2441 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2441 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3639 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3639 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3640 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3640 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1572315110, 3276822, 819200, 0, 0 ] } , "name": "/layers.26/self_attn/o_proj/Linear", "outputIndexes": [ 3641 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3641 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3642 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3642 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2442 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2362, 2442 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/Add_output_0", "outputIndexes": [ 2443 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2443 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1576411132, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.26/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2444 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2444 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3643 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3643 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3644 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3644 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1576431612, 13434902, 3358720, 0, 0 ] } , "name": "/layers.26/mlp/gate_proj/Linear", "outputIndexes": [ 3645 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3645 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3646 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3646 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2445 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2445 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.26/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2446 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3644 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1593225234, 13434902, 3358720, 0, 0 ] } , "name": "/layers.26/mlp/up_proj/Linear", "outputIndexes": [ 3649 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3649 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3650 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3650 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2447 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2446, 2447 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/mlp/Mul_output_0", "outputIndexes": [ 2448 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2448 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3651 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3651 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3652 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3652 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1610018856, 13434902, 3358720, 0, 0 ] } , "name": "/layers.26/mlp/down_proj/Linear", "outputIndexes": [ 3653 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3653 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3654 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3654 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2449 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2443, 2449 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/Add_1_output_0", "outputIndexes": [ 2450 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2450, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/Reshape_output_0", "outputIndexes": [ 2451 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2451 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1626812478, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.27/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2452 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2452 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3655 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3655 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3656 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3656 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1626832958, 3276822, 819200, 0, 0 ] } , "name": "/layers.27/self_attn/q_proj/Linear", "outputIndexes": [ 3657 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3657 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3658 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3658 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2453 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2452 ] , "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_output_0", "outputIndexes": [ 2454 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2454 ] , "main_type": "NONE", "name": "Shape10127", "outputIndexes": [ 2455 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2454 ] , "main_type": "NONE", "name": "Rank10129", "outputIndexes": [ 2456 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2456, 2456 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10131", "outputIndexes": [ 2457 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2457 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10132", "outputIndexes": [ 2458 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2457, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10134", "outputIndexes": [ 2459 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2459 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10135", "outputIndexes": [ 2460 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2455, 2458, 2460, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10138", "outputIndexes": [ 2461 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2461 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10139", "outputIndexes": [ 2462 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2462, 2462 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10141", "outputIndexes": [ 2463 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2454, 2463, 2457 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_output_0", "outputIndexes": [ 2464 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2464, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2465 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2457 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10149", "outputIndexes": [ 2466 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2459 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10152", "outputIndexes": [ 2467 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2455, 2466, 2467, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10155", "outputIndexes": [ 2468 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2468 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10156", "outputIndexes": [ 2469 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2469 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10157", "outputIndexes": [ 2470 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2470, 2469 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10158", "outputIndexes": [ 2471 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2454, 2471, 2457 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_1_output_0", "outputIndexes": [ 2472 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2472, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2473 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2465, 2473, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.27/self_attn/Concat_output_0", "outputIndexes": [ 2474 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2453, 2474 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/self_attn/Reshape_output_0", "outputIndexes": [ 2475 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2475, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_output_0", "outputIndexes": [ 2476 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2475 ] , "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_2_output_0", "outputIndexes": [ 2477 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2477 ] , "main_type": "NONE", "name": "Shape10259", "outputIndexes": [ 2478 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2477 ] , "main_type": "NONE", "name": "Rank10261", "outputIndexes": [ 2479 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2479, 2479 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10263", "outputIndexes": [ 2480 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2480 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10264", "outputIndexes": [ 2481 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2480, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10266", "outputIndexes": [ 2482 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2482 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10267", "outputIndexes": [ 2483 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2478, 2481, 2483, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10270", "outputIndexes": [ 2484 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2484 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10271", "outputIndexes": [ 2485 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2485 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10272", "outputIndexes": [ 2486 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2486, 2485 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10273", "outputIndexes": [ 2487 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2477, 2487, 2480 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_2_output_0", "outputIndexes": [ 2488 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2488, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Div_output_0", "outputIndexes": [ 2489 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2489, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2490 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2475, 2490, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_1_output_0", "outputIndexes": [ 2491 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2491 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.27/self_attn/Neg_output_0", "outputIndexes": [ 2492 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2489, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2493 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2475, 22, 2493, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_output_0", "outputIndexes": [ 2494 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2492, 2494 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.27/self_attn/Concat_3_output_0", "outputIndexes": [ 2495 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2495, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_1_output_0", "outputIndexes": [ 2496 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2476, 2496 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Add_output_0", "outputIndexes": [ 2497 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3656 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1630928980, 655382, 163840, 0, 0 ] } , "name": "/layers.27/self_attn/k_proj/Linear", "outputIndexes": [ 3661 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3661 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3662 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3662 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2498 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2464, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2499 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2472, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2500 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2499, 2500, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.27/self_attn/Concat_1_output_0", "outputIndexes": [ 2501 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2498, 2501 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/self_attn/Reshape_1_output_0", "outputIndexes": [ 2502 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2502, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_2_output_0", "outputIndexes": [ 2503 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2502 ] , "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_3_output_0", "outputIndexes": [ 2504 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2504 ] , "main_type": "NONE", "name": "Shape10165", "outputIndexes": [ 2505 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2504 ] , "main_type": "NONE", "name": "Rank10167", "outputIndexes": [ 2506 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2506, 2506 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10169", "outputIndexes": [ 2507 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2507 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10170", "outputIndexes": [ 2508 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2507, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10172", "outputIndexes": [ 2509 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2509 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10173", "outputIndexes": [ 2510 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2505, 2508, 2510, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10176", "outputIndexes": [ 2511 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2511 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10177", "outputIndexes": [ 2512 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2512 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10178", "outputIndexes": [ 2513 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2513, 2512 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10179", "outputIndexes": [ 2514 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2504, 2514, 2507 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_3_output_0", "outputIndexes": [ 2515 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2515, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Div_1_output_0", "outputIndexes": [ 2516 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2516, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2517 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2502, 2517, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_3_output_0", "outputIndexes": [ 2518 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2518 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.27/self_attn/Neg_1_output_0", "outputIndexes": [ 2519 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2516, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2520 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2502, 22, 2520, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_2_output_0", "outputIndexes": [ 2521 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2519, 2521 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.27/self_attn/Concat_4_output_0", "outputIndexes": [ 2522 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2522, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_3_output_0", "outputIndexes": [ 2523 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2503, 2523 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Add_1_output_0", "outputIndexes": [ 2524 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3656 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1631748202, 655382, 163840, 0, 0 ] } , "name": "/layers.27/self_attn/v_proj/Linear", "outputIndexes": [ 3665 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3665 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3666 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3666 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2525 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2464, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2526 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2472, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2527 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2526, 2527, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.27/self_attn/Concat_2_output_0", "outputIndexes": [ 2528 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2525, 2528 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/self_attn/Reshape_2_output_0", "outputIndexes": [ 2529 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2497, 2524, 2529, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.27/self_attn/Reshape_7_output_0", "outputIndexes": [ 2530 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2530 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3667 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3667 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3668 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3668 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1632567424, 3276822, 819200, 0, 0 ] } , "name": "/layers.27/self_attn/o_proj/Linear", "outputIndexes": [ 3669 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3669 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3670 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3670 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2531 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2451, 2531 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/Add_output_0", "outputIndexes": [ 2532 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2532 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1636663446, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.27/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2533 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2533 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3671 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3671 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3672 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3672 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1636683926, 13434902, 3358720, 0, 0 ] } , "name": "/layers.27/mlp/gate_proj/Linear", "outputIndexes": [ 3673 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3673 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3674 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3674 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2534 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2534 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.27/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2535 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3672 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1653477548, 13434902, 3358720, 0, 0 ] } , "name": "/layers.27/mlp/up_proj/Linear", "outputIndexes": [ 3677 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3677 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3678 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3678 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2536 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2535, 2536 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/mlp/Mul_output_0", "outputIndexes": [ 2537 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2537 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3679 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3679 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3680 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3680 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1670271170, 13434902, 3358720, 0, 0 ] } , "name": "/layers.27/mlp/down_proj/Linear", "outputIndexes": [ 3681 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3681 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3682 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3682 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2538 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2532, 2538 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/Add_1_output_0", "outputIndexes": [ 2539 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2539, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.28/Reshape_output_0", "outputIndexes": [ 2540 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2540 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1687064792, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.28/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2541 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2541 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3683 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3683 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3684 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3684 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1687085272, 3276822, 819200, 0, 0 ] } , "name": "/layers.28/self_attn/q_proj/Linear", "outputIndexes": [ 3685 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3685 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3686 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3686 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2542 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2541 ] , "main_type": "NONE", "name": "/blocks.28/self_attn/Shape_output_0", "outputIndexes": [ 2543 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2543 ] , "main_type": "NONE", "name": "Shape10498", "outputIndexes": [ 2544 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2543 ] , "main_type": "NONE", "name": "Rank10500", "outputIndexes": [ 2545 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2545, 2545 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10502", "outputIndexes": [ 2546 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2546 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10503", "outputIndexes": [ 2547 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2546, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10505", "outputIndexes": [ 2548 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2548 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10506", "outputIndexes": [ 2549 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2544, 2547, 2549, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10509", "outputIndexes": [ 2550 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2550 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10510", "outputIndexes": [ 2551 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2551, 2551 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10512", "outputIndexes": [ 2552 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2543, 2552, 2546 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_output_0", "outputIndexes": [ 2553 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2553, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2554 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2546 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10520", "outputIndexes": [ 2555 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2548 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10523", "outputIndexes": [ 2556 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2544, 2555, 2556, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10526", "outputIndexes": [ 2557 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2557 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10527", "outputIndexes": [ 2558 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2558 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10528", "outputIndexes": [ 2559 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2559, 2558 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10529", "outputIndexes": [ 2560 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2543, 2560, 2546 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_1_output_0", "outputIndexes": [ 2561 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2561, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2562 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2554, 2562, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.28/self_attn/Concat_output_0", "outputIndexes": [ 2563 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2542, 2563 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.28/self_attn/Reshape_output_0", "outputIndexes": [ 2564 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2564, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Mul_output_0", "outputIndexes": [ 2565 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2564 ] , "main_type": "NONE", "name": "/blocks.28/self_attn/Shape_2_output_0", "outputIndexes": [ 2566 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2566 ] , "main_type": "NONE", "name": "Shape10630", "outputIndexes": [ 2567 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2566 ] , "main_type": "NONE", "name": "Rank10632", "outputIndexes": [ 2568 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2568, 2568 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10634", "outputIndexes": [ 2569 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2569 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10635", "outputIndexes": [ 2570 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2569, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10637", "outputIndexes": [ 2571 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2571 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10638", "outputIndexes": [ 2572 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2567, 2570, 2572, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10641", "outputIndexes": [ 2573 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2573 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10642", "outputIndexes": [ 2574 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2574 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10643", "outputIndexes": [ 2575 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2575, 2574 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10644", "outputIndexes": [ 2576 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2566, 2576, 2569 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_2_output_0", "outputIndexes": [ 2577 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2577, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Div_output_0", "outputIndexes": [ 2578 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2578, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2579 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2564, 2579, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.28/self_attn/Slice_1_output_0", "outputIndexes": [ 2580 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2580 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.28/self_attn/Neg_output_0", "outputIndexes": [ 2581 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2578, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2582 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2564, 22, 2582, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.28/self_attn/Slice_output_0", "outputIndexes": [ 2583 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2581, 2583 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.28/self_attn/Concat_3_output_0", "outputIndexes": [ 2584 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2584, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Mul_1_output_0", "outputIndexes": [ 2585 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2565, 2585 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Add_output_0", "outputIndexes": [ 2586 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3684 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1691181294, 655382, 163840, 0, 0 ] } , "name": "/layers.28/self_attn/k_proj/Linear", "outputIndexes": [ 3689 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3689 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3690 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3690 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2587 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2553, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2588 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2561, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2589 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2588, 2589, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.28/self_attn/Concat_1_output_0", "outputIndexes": [ 2590 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2587, 2590 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.28/self_attn/Reshape_1_output_0", "outputIndexes": [ 2591 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2591, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Mul_2_output_0", "outputIndexes": [ 2592 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2591 ] , "main_type": "NONE", "name": "/blocks.28/self_attn/Shape_3_output_0", "outputIndexes": [ 2593 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2593 ] , "main_type": "NONE", "name": "Shape10536", "outputIndexes": [ 2594 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2593 ] , "main_type": "NONE", "name": "Rank10538", "outputIndexes": [ 2595 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2595, 2595 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10540", "outputIndexes": [ 2596 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2596 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10541", "outputIndexes": [ 2597 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2596, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10543", "outputIndexes": [ 2598 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2598 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10544", "outputIndexes": [ 2599 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2594, 2597, 2599, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10547", "outputIndexes": [ 2600 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2600 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10548", "outputIndexes": [ 2601 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2601 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10549", "outputIndexes": [ 2602 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2602, 2601 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10550", "outputIndexes": [ 2603 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2593, 2603, 2596 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_3_output_0", "outputIndexes": [ 2604 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2604, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Div_1_output_0", "outputIndexes": [ 2605 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2605, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2606 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2591, 2606, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.28/self_attn/Slice_3_output_0", "outputIndexes": [ 2607 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2607 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.28/self_attn/Neg_1_output_0", "outputIndexes": [ 2608 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2605, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2609 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2591, 22, 2609, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.28/self_attn/Slice_2_output_0", "outputIndexes": [ 2610 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2608, 2610 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.28/self_attn/Concat_4_output_0", "outputIndexes": [ 2611 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2611, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Mul_3_output_0", "outputIndexes": [ 2612 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2592, 2612 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Add_1_output_0", "outputIndexes": [ 2613 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3684 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1692000516, 655382, 163840, 0, 0 ] } , "name": "/layers.28/self_attn/v_proj/Linear", "outputIndexes": [ 3693 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3693 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3694 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3694 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2614 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2553, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2615 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2561, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2616 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2615, 2616, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.28/self_attn/Concat_2_output_0", "outputIndexes": [ 2617 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2614, 2617 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.28/self_attn/Reshape_2_output_0", "outputIndexes": [ 2618 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2586, 2613, 2618, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.28/self_attn/Reshape_7_output_0", "outputIndexes": [ 2619 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2619 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3695 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3695 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3696 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3696 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1692819738, 3276822, 819200, 0, 0 ] } , "name": "/layers.28/self_attn/o_proj/Linear", "outputIndexes": [ 3697 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3697 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3698 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3698 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2620 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2540, 2620 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/Add_output_0", "outputIndexes": [ 2621 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2621 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1696915760, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.28/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2622 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2622 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3699 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3699 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3700 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3700 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1696936240, 13434902, 3358720, 0, 0 ] } , "name": "/layers.28/mlp/gate_proj/Linear", "outputIndexes": [ 3701 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3701 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3702 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3702 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2623 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2623 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.28/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2624 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3700 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1713729862, 13434902, 3358720, 0, 0 ] } , "name": "/layers.28/mlp/up_proj/Linear", "outputIndexes": [ 3705 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3705 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3706 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3706 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2625 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2624, 2625 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/mlp/Mul_output_0", "outputIndexes": [ 2626 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2626 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3707 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3707 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3708 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3708 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1730523484, 13434902, 3358720, 0, 0 ] } , "name": "/layers.28/mlp/down_proj/Linear", "outputIndexes": [ 3709 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3709 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3710 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3710 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2627 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2621, 2627 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/Add_1_output_0", "outputIndexes": [ 2628 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2628, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.29/Reshape_output_0", "outputIndexes": [ 2629 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2629 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1747317106, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.29/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2630 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2630 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3711 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3711 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3712 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3712 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1747337586, 3276822, 819200, 0, 0 ] } , "name": "/layers.29/self_attn/q_proj/Linear", "outputIndexes": [ 3713 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3713 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3714 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3714 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2631 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2630 ] , "main_type": "NONE", "name": "/blocks.29/self_attn/Shape_output_0", "outputIndexes": [ 2632 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2632 ] , "main_type": "NONE", "name": "Shape10869", "outputIndexes": [ 2633 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2632 ] , "main_type": "NONE", "name": "Rank10871", "outputIndexes": [ 2634 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2634, 2634 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10873", "outputIndexes": [ 2635 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2635 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10874", "outputIndexes": [ 2636 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2635, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10876", "outputIndexes": [ 2637 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2637 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10877", "outputIndexes": [ 2638 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2633, 2636, 2638, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10880", "outputIndexes": [ 2639 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2639 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10881", "outputIndexes": [ 2640 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2640, 2640 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10883", "outputIndexes": [ 2641 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2632, 2641, 2635 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_output_0", "outputIndexes": [ 2642 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2642, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2643 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2635 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10891", "outputIndexes": [ 2644 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2637 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10894", "outputIndexes": [ 2645 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2633, 2644, 2645, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10897", "outputIndexes": [ 2646 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2646 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10898", "outputIndexes": [ 2647 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2647 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10899", "outputIndexes": [ 2648 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2648, 2647 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10900", "outputIndexes": [ 2649 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2632, 2649, 2635 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_1_output_0", "outputIndexes": [ 2650 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2650, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2651 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2643, 2651, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.29/self_attn/Concat_output_0", "outputIndexes": [ 2652 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2631, 2652 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.29/self_attn/Reshape_output_0", "outputIndexes": [ 2653 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2653, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Mul_output_0", "outputIndexes": [ 2654 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2653 ] , "main_type": "NONE", "name": "/blocks.29/self_attn/Shape_2_output_0", "outputIndexes": [ 2655 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2655 ] , "main_type": "NONE", "name": "Shape11001", "outputIndexes": [ 2656 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2655 ] , "main_type": "NONE", "name": "Rank11003", "outputIndexes": [ 2657 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2657, 2657 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11005", "outputIndexes": [ 2658 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2658 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11006", "outputIndexes": [ 2659 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2658, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11008", "outputIndexes": [ 2660 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2660 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11009", "outputIndexes": [ 2661 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2656, 2659, 2661, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11012", "outputIndexes": [ 2662 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2662 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11013", "outputIndexes": [ 2663 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2663 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11014", "outputIndexes": [ 2664 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2664, 2663 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11015", "outputIndexes": [ 2665 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2655, 2665, 2658 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_2_output_0", "outputIndexes": [ 2666 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2666, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Div_output_0", "outputIndexes": [ 2667 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2667, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2668 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2653, 2668, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.29/self_attn/Slice_1_output_0", "outputIndexes": [ 2669 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2669 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.29/self_attn/Neg_output_0", "outputIndexes": [ 2670 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2667, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2671 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2653, 22, 2671, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.29/self_attn/Slice_output_0", "outputIndexes": [ 2672 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2670, 2672 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.29/self_attn/Concat_3_output_0", "outputIndexes": [ 2673 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2673, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Mul_1_output_0", "outputIndexes": [ 2674 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2654, 2674 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Add_output_0", "outputIndexes": [ 2675 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3712 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1751433608, 655382, 163840, 0, 0 ] } , "name": "/layers.29/self_attn/k_proj/Linear", "outputIndexes": [ 3717 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3717 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3718 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3718 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2676 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2642, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2677 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2650, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2678 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2677, 2678, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.29/self_attn/Concat_1_output_0", "outputIndexes": [ 2679 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2676, 2679 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.29/self_attn/Reshape_1_output_0", "outputIndexes": [ 2680 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2680, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Mul_2_output_0", "outputIndexes": [ 2681 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2680 ] , "main_type": "NONE", "name": "/blocks.29/self_attn/Shape_3_output_0", "outputIndexes": [ 2682 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2682 ] , "main_type": "NONE", "name": "Shape10907", "outputIndexes": [ 2683 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2682 ] , "main_type": "NONE", "name": "Rank10909", "outputIndexes": [ 2684 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2684, 2684 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10911", "outputIndexes": [ 2685 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2685 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10912", "outputIndexes": [ 2686 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2685, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10914", "outputIndexes": [ 2687 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2687 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10915", "outputIndexes": [ 2688 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2683, 2686, 2688, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10918", "outputIndexes": [ 2689 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2689 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10919", "outputIndexes": [ 2690 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2690 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10920", "outputIndexes": [ 2691 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2691, 2690 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10921", "outputIndexes": [ 2692 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2682, 2692, 2685 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_3_output_0", "outputIndexes": [ 2693 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2693, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Div_1_output_0", "outputIndexes": [ 2694 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2694, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2695 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2680, 2695, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.29/self_attn/Slice_3_output_0", "outputIndexes": [ 2696 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2696 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.29/self_attn/Neg_1_output_0", "outputIndexes": [ 2697 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2694, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2698 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2680, 22, 2698, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.29/self_attn/Slice_2_output_0", "outputIndexes": [ 2699 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2697, 2699 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.29/self_attn/Concat_4_output_0", "outputIndexes": [ 2700 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2700, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Mul_3_output_0", "outputIndexes": [ 2701 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2681, 2701 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Add_1_output_0", "outputIndexes": [ 2702 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3712 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1752252830, 655382, 163840, 0, 0 ] } , "name": "/layers.29/self_attn/v_proj/Linear", "outputIndexes": [ 3721 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3721 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3722 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3722 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2703 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2642, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2704 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2650, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2705 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2704, 2705, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.29/self_attn/Concat_2_output_0", "outputIndexes": [ 2706 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2703, 2706 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.29/self_attn/Reshape_2_output_0", "outputIndexes": [ 2707 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2675, 2702, 2707, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.29/self_attn/Reshape_7_output_0", "outputIndexes": [ 2708 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2708 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3723 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3723 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3724 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3724 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1753072052, 3276822, 819200, 0, 0 ] } , "name": "/layers.29/self_attn/o_proj/Linear", "outputIndexes": [ 3725 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3725 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3726 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3726 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2709 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2629, 2709 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/Add_output_0", "outputIndexes": [ 2710 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2710 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1757168074, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.29/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2711 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2711 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3727 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3727 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3728 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3728 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1757188554, 13434902, 3358720, 0, 0 ] } , "name": "/layers.29/mlp/gate_proj/Linear", "outputIndexes": [ 3729 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3729 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3730 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3730 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2712 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2712 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.29/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2713 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3728 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1773982176, 13434902, 3358720, 0, 0 ] } , "name": "/layers.29/mlp/up_proj/Linear", "outputIndexes": [ 3733 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3733 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3734 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3734 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2714 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2713, 2714 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/mlp/Mul_output_0", "outputIndexes": [ 2715 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2715 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3735 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3735 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3736 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3736 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1790775798, 13434902, 3358720, 0, 0 ] } , "name": "/layers.29/mlp/down_proj/Linear", "outputIndexes": [ 3737 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3737 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3738 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3738 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2716 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2710, 2716 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/Add_1_output_0", "outputIndexes": [ 2717 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2717, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.30/Reshape_output_0", "outputIndexes": [ 2718 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2718 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1807569420, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.30/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2719 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2719 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3739 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3739 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3740 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3740 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1807589900, 3276822, 819200, 0, 0 ] } , "name": "/layers.30/self_attn/q_proj/Linear", "outputIndexes": [ 3741 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3741 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3742 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3742 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2720 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2719 ] , "main_type": "NONE", "name": "/blocks.30/self_attn/Shape_output_0", "outputIndexes": [ 2721 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2721 ] , "main_type": "NONE", "name": "Shape11240", "outputIndexes": [ 2722 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2721 ] , "main_type": "NONE", "name": "Rank11242", "outputIndexes": [ 2723 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2723, 2723 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11244", "outputIndexes": [ 2724 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2724 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11245", "outputIndexes": [ 2725 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2724, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11247", "outputIndexes": [ 2726 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2726 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11248", "outputIndexes": [ 2727 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2722, 2725, 2727, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11251", "outputIndexes": [ 2728 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2728 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11252", "outputIndexes": [ 2729 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2729, 2729 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11254", "outputIndexes": [ 2730 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2721, 2730, 2724 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_output_0", "outputIndexes": [ 2731 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2731, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2732 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2724 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11262", "outputIndexes": [ 2733 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2726 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11265", "outputIndexes": [ 2734 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2722, 2733, 2734, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11268", "outputIndexes": [ 2735 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2735 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11269", "outputIndexes": [ 2736 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2736 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11270", "outputIndexes": [ 2737 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2737, 2736 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11271", "outputIndexes": [ 2738 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2721, 2738, 2724 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_1_output_0", "outputIndexes": [ 2739 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2739, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2740 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2732, 2740, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.30/self_attn/Concat_output_0", "outputIndexes": [ 2741 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2720, 2741 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.30/self_attn/Reshape_output_0", "outputIndexes": [ 2742 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2742, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Mul_output_0", "outputIndexes": [ 2743 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2742 ] , "main_type": "NONE", "name": "/blocks.30/self_attn/Shape_2_output_0", "outputIndexes": [ 2744 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2744 ] , "main_type": "NONE", "name": "Shape11372", "outputIndexes": [ 2745 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2744 ] , "main_type": "NONE", "name": "Rank11374", "outputIndexes": [ 2746 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2746, 2746 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11376", "outputIndexes": [ 2747 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2747 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11377", "outputIndexes": [ 2748 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2747, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11379", "outputIndexes": [ 2749 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2749 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11380", "outputIndexes": [ 2750 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2745, 2748, 2750, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11383", "outputIndexes": [ 2751 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2751 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11384", "outputIndexes": [ 2752 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2752 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11385", "outputIndexes": [ 2753 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2753, 2752 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11386", "outputIndexes": [ 2754 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2744, 2754, 2747 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_2_output_0", "outputIndexes": [ 2755 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2755, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Div_output_0", "outputIndexes": [ 2756 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2756, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2757 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2742, 2757, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.30/self_attn/Slice_1_output_0", "outputIndexes": [ 2758 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2758 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.30/self_attn/Neg_output_0", "outputIndexes": [ 2759 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2756, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2760 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2742, 22, 2760, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.30/self_attn/Slice_output_0", "outputIndexes": [ 2761 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2759, 2761 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.30/self_attn/Concat_3_output_0", "outputIndexes": [ 2762 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2762, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Mul_1_output_0", "outputIndexes": [ 2763 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2743, 2763 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Add_output_0", "outputIndexes": [ 2764 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3740 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1811685922, 655382, 163840, 0, 0 ] } , "name": "/layers.30/self_attn/k_proj/Linear", "outputIndexes": [ 3745 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3745 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3746 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3746 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2765 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2731, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2766 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2739, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2767 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2766, 2767, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.30/self_attn/Concat_1_output_0", "outputIndexes": [ 2768 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2765, 2768 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.30/self_attn/Reshape_1_output_0", "outputIndexes": [ 2769 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2769, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Mul_2_output_0", "outputIndexes": [ 2770 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2769 ] , "main_type": "NONE", "name": "/blocks.30/self_attn/Shape_3_output_0", "outputIndexes": [ 2771 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2771 ] , "main_type": "NONE", "name": "Shape11278", "outputIndexes": [ 2772 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2771 ] , "main_type": "NONE", "name": "Rank11280", "outputIndexes": [ 2773 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2773, 2773 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11282", "outputIndexes": [ 2774 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2774 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11283", "outputIndexes": [ 2775 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2774, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11285", "outputIndexes": [ 2776 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2776 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11286", "outputIndexes": [ 2777 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2772, 2775, 2777, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11289", "outputIndexes": [ 2778 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2778 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11290", "outputIndexes": [ 2779 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2779 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11291", "outputIndexes": [ 2780 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2780, 2779 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11292", "outputIndexes": [ 2781 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2771, 2781, 2774 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_3_output_0", "outputIndexes": [ 2782 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2782, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Div_1_output_0", "outputIndexes": [ 2783 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2783, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2784 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2769, 2784, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.30/self_attn/Slice_3_output_0", "outputIndexes": [ 2785 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2785 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.30/self_attn/Neg_1_output_0", "outputIndexes": [ 2786 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2783, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2787 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2769, 22, 2787, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.30/self_attn/Slice_2_output_0", "outputIndexes": [ 2788 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2786, 2788 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.30/self_attn/Concat_4_output_0", "outputIndexes": [ 2789 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2789, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Mul_3_output_0", "outputIndexes": [ 2790 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2770, 2790 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Add_1_output_0", "outputIndexes": [ 2791 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3740 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1812505144, 655382, 163840, 0, 0 ] } , "name": "/layers.30/self_attn/v_proj/Linear", "outputIndexes": [ 3749 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3749 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3750 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3750 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2792 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2731, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2793 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2739, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2794 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2793, 2794, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.30/self_attn/Concat_2_output_0", "outputIndexes": [ 2795 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2792, 2795 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.30/self_attn/Reshape_2_output_0", "outputIndexes": [ 2796 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2764, 2791, 2796, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.30/self_attn/Reshape_7_output_0", "outputIndexes": [ 2797 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2797 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3751 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3751 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3752 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3752 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1813324366, 3276822, 819200, 0, 0 ] } , "name": "/layers.30/self_attn/o_proj/Linear", "outputIndexes": [ 3753 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3753 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3754 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3754 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2798 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2718, 2798 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/Add_output_0", "outputIndexes": [ 2799 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2799 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1817420388, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.30/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2800 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2800 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3755 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3755 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3756 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3756 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1817440868, 13434902, 3358720, 0, 0 ] } , "name": "/layers.30/mlp/gate_proj/Linear", "outputIndexes": [ 3757 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3757 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3758 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3758 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2801 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2801 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.30/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2802 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3756 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1834234490, 13434902, 3358720, 0, 0 ] } , "name": "/layers.30/mlp/up_proj/Linear", "outputIndexes": [ 3761 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3761 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3762 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3762 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2803 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2802, 2803 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/mlp/Mul_output_0", "outputIndexes": [ 2804 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2804 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3763 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3763 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3764 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3764 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1851028112, 13434902, 3358720, 0, 0 ] } , "name": "/layers.30/mlp/down_proj/Linear", "outputIndexes": [ 3765 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3765 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3766 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3766 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2805 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2799, 2805 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/Add_1_output_0", "outputIndexes": [ 2806 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2806, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.31/Reshape_output_0", "outputIndexes": [ 2807 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2807 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1867821734, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.31/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2808 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2808 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3767 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3767 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3768 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3768 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1867842214, 3276822, 819200, 0, 0 ] } , "name": "/layers.31/self_attn/q_proj/Linear", "outputIndexes": [ 3769 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3769 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3770 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3770 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2809 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2808 ] , "main_type": "NONE", "name": "/blocks.31/self_attn/Shape_output_0", "outputIndexes": [ 2810 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2810 ] , "main_type": "NONE", "name": "Shape11611", "outputIndexes": [ 2811 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2810 ] , "main_type": "NONE", "name": "Rank11613", "outputIndexes": [ 2812 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2812, 2812 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11615", "outputIndexes": [ 2813 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2813 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11616", "outputIndexes": [ 2814 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2813, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11618", "outputIndexes": [ 2815 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2815 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11619", "outputIndexes": [ 2816 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2811, 2814, 2816, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11622", "outputIndexes": [ 2817 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2817 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11623", "outputIndexes": [ 2818 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2818, 2818 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11625", "outputIndexes": [ 2819 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2810, 2819, 2813 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_output_0", "outputIndexes": [ 2820 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2820, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2821 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2813 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11633", "outputIndexes": [ 2822 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2815 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11636", "outputIndexes": [ 2823 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2811, 2822, 2823, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11639", "outputIndexes": [ 2824 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2824 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11640", "outputIndexes": [ 2825 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2825 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11641", "outputIndexes": [ 2826 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2826, 2825 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11642", "outputIndexes": [ 2827 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2810, 2827, 2813 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_1_output_0", "outputIndexes": [ 2828 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2828, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2829 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2821, 2829, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.31/self_attn/Concat_output_0", "outputIndexes": [ 2830 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2809, 2830 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.31/self_attn/Reshape_output_0", "outputIndexes": [ 2831 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2831, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Mul_output_0", "outputIndexes": [ 2832 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2831 ] , "main_type": "NONE", "name": "/blocks.31/self_attn/Shape_2_output_0", "outputIndexes": [ 2833 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2833 ] , "main_type": "NONE", "name": "Shape11712", "outputIndexes": [ 2834 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2833 ] , "main_type": "NONE", "name": "Rank11714", "outputIndexes": [ 2835 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2835, 2835 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11716", "outputIndexes": [ 2836 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2836 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11717", "outputIndexes": [ 2837 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2836, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11719", "outputIndexes": [ 2838 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2838 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11720", "outputIndexes": [ 2839 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2834, 2837, 2839, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11723", "outputIndexes": [ 2840 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2840 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11724", "outputIndexes": [ 2841 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2841 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11725", "outputIndexes": [ 2842 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2842, 2841 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11726", "outputIndexes": [ 2843 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2833, 2843, 2836 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_2_output_0", "outputIndexes": [ 2844 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2844, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Div_output_0", "outputIndexes": [ 2845 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2845, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2846 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2831, 2846, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.31/self_attn/Slice_1_output_0", "outputIndexes": [ 2847 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2847 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.31/self_attn/Neg_output_0", "outputIndexes": [ 2848 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2845, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2849 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2831, 22, 2849, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.31/self_attn/Slice_output_0", "outputIndexes": [ 2850 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2848, 2850 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.31/self_attn/Concat_3_output_0", "outputIndexes": [ 2851 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2851, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Mul_1_output_0", "outputIndexes": [ 2852 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2832, 2852 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Add_output_0", "outputIndexes": [ 2853 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3768 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1871938236, 655382, 163840, 0, 0 ] } , "name": "/layers.31/self_attn/k_proj/Linear", "outputIndexes": [ 3773 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3773 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3774 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3774 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2854 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2820, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2855 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2828, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2856 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2855, 2856, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.31/self_attn/Concat_1_output_0", "outputIndexes": [ 2857 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2854, 2857 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.31/self_attn/Reshape_1_output_0", "outputIndexes": [ 2858 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2858, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Mul_2_output_0", "outputIndexes": [ 2859 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2858 ] , "main_type": "NONE", "name": "/blocks.31/self_attn/Shape_3_output_0", "outputIndexes": [ 2860 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2860 ] , "main_type": "NONE", "name": "Shape11649", "outputIndexes": [ 2861 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2860 ] , "main_type": "NONE", "name": "Rank11651", "outputIndexes": [ 2862 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2862, 2862 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11653", "outputIndexes": [ 2863 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2863 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11654", "outputIndexes": [ 2864 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2863, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11656", "outputIndexes": [ 2865 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2865 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11657", "outputIndexes": [ 2866 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2861, 2864, 2866, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11660", "outputIndexes": [ 2867 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2867 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11661", "outputIndexes": [ 2868 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2868 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11662", "outputIndexes": [ 2869 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2869, 2868 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11663", "outputIndexes": [ 2870 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2860, 2870, 2863 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_3_output_0", "outputIndexes": [ 2871 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2871, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Div_1_output_0", "outputIndexes": [ 2872 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2872, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2873 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2858, 2873, 77, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.31/self_attn/Slice_3_output_0", "outputIndexes": [ 2874 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2874 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.31/self_attn/Neg_1_output_0", "outputIndexes": [ 2875 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2872, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2876 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2858, 22, 2876, 78, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.31/self_attn/Slice_2_output_0", "outputIndexes": [ 2877 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2875, 2877 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.31/self_attn/Concat_4_output_0", "outputIndexes": [ 2878 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2878, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Mul_3_output_0", "outputIndexes": [ 2879 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2859, 2879 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Add_1_output_0", "outputIndexes": [ 2880 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3768 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 512, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 20480, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1872757458, 655382, 163840, 0, 0 ] } , "name": "/layers.31/self_attn/v_proj/Linear", "outputIndexes": [ 3777 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3777 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3778 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3778 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 512 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2881 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2820, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2882 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2828, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2883 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2882, 2883, 96, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.31/self_attn/Concat_2_output_0", "outputIndexes": [ 2884 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2881, 2884 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.31/self_attn/Reshape_2_output_0", "outputIndexes": [ 2885 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2853, 2880, 2885, 126 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.31/self_attn/Reshape_7_output_0", "outputIndexes": [ 2886 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2886 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3779 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3779 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3780 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3780 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 102400, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1873576680, 3276822, 819200, 0, 0 ] } , "name": "/layers.31/self_attn/o_proj/Linear", "outputIndexes": [ 3781 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3781 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3782 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3782 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2887 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2807, 2887 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/Add_output_0", "outputIndexes": [ 2888 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2888 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1877672702, 10240, 10240 ] , "useRMSNorm": true } , "name": "/blocks.31/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2889 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2889 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3783 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3783 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3784 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3784 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1877693182, 13434902, 3358720, 0, 0 ] } , "name": "/layers.31/mlp/gate_proj/Linear", "outputIndexes": [ 3785 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3785 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3786 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3786 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2890 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2890 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.31/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2891 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3784 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 10496, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1894486804, 13434902, 3358720, 0, 0 ] } , "name": "/layers.31/mlp/up_proj/Linear", "outputIndexes": [ 3789 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3789 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3790 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3790 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 10496 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2892 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2891, 2892 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/mlp/Mul_output_0", "outputIndexes": [ 2893 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2893 ] , "main_type": "Reshape", "main": { "dims": [ -1, 10496, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3791 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3791 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3792 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3792 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 10496, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 419840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1911280426, 13434902, 3358720, 0, 0 ] } , "name": "/layers.31/mlp/down_proj/Linear", "outputIndexes": [ 3793 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3793 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3794 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3794 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2894 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2888, 2894 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/Add_1_output_0", "outputIndexes": [ 2895 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2895, 3, 77, 17, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_output_0", "outputIndexes": [ 2896 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2896 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1928074048, 10240, 10240 ] , "useRMSNorm": true } , "name": "hidden_states", "outputIndexes": [ 2897 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2897 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/lm/lm_head/Linear/pre_reshape", "outputIndexes": [ 3795 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3795 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/lm/lm_head/Linear/pre_convert", "outputIndexes": [ 3796 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3796 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 166144, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 6645760, "has_scaleInt": false, "shapeInt32": true, "weightSize": 0 } , "external": [ 1928094528, 212664346, 53166080, 0, 0 ] } , "name": "/lm/lm_head/Linear", "outputIndexes": [ 3797 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3797 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/lm/lm_head/Linear/post_convert", "outputIndexes": [ 3798 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3798 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 166144 ] , "dimType": "NCHW" } , "name": "/lm/lm_head/Linear/post_reshape", "outputIndexes": [ 2898 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } ] , "outputName": [ "logits", "hidden_states", "presents" ] , "preferForwardType": "CPU", "sourceType": "ONNX", "tensorName": [ "past_key_values", "presents", "position_ids", "logits_index", "input_ids", "/blocks.0/Constant_output_0", "/blocks.0/Reshape_output_0", "/blocks.0/input_layernorm/Mul_1_output_0", "/blocks.0/self_attn/q_proj/FakeLinear_output_0", "/blocks.0/self_attn/Shape_output_0", "Shape51", "Rank53", "BinaryOp55", "Unsqueeze56", "Const9", "BinaryOp58", "Unsqueeze59", "Unsqueeze61", "StridedSlice62", "Squeeze63", "BinaryOp65", "/blocks.0/self_attn/Gather_output_0", "/rotary/Constant_4_output_0", "/blocks.0/self_attn/Unsqueeze_output_0", "Unsqueeze75", "Unsqueeze78", "StridedSlice81", "Squeeze82", "BinaryOp83", "BinaryOp84", "/blocks.0/self_attn/Gather_1_output_0", "/blocks.0/self_attn/Unsqueeze_1_output_0", "/blocks.0/self_attn/Constant_3_output_0", "/blocks.0/self_attn/Constant_4_output_0", "/blocks.0/self_attn/Concat_output_0", "/blocks.0/self_attn/Reshape_output_0", "/rotary/Cast_output_0", "/rotary/Constant_1_output_0", "/rotary/Reshape_output_0", "/rotary/Constant_2_output_0", "/rotary/Mul_output_0", "/rotary/Cos_output_0", "/rotary/Unsqueeze_output_0", "/rotary/Sin_output_0", "/rotary/Unsqueeze_1_output_0", "/rotary/Concat_output_0", "/rotary/Concat_1_output_0", "/rotary/Constant_7_output_0", "/rotary/Unsqueeze_2_output_0", "/rotary/Unsqueeze_3_output_0", "Shape107", "Rank109", "BinaryOp111", "Unsqueeze112", "BinaryOp114", "Unsqueeze115", "StridedSlice118", "Squeeze119", "BinaryOp121", "/blocks.0/self_attn/Gather_2_output_0", "/blocks.0/self_attn/Mul_output_0", "/blocks.0/self_attn/Shape_2_output_0", "/blocks.0/self_attn/Constant_10_output_0", "Shape239", "Rank241", "BinaryOp243", "Unsqueeze244", "BinaryOp246", "Unsqueeze247", "StridedSlice250", "Squeeze251", "BinaryOp252", "BinaryOp253", "/blocks.0/self_attn/Gather_4_output_0", "/rotary/Constant_6_output_0", "/blocks.0/self_attn/Div_output_0", "/blocks.0/self_attn/Unsqueeze_7_output_0", "/blocks.0/self_attn/Constant_19_output_0", "/blocks.0/self_attn/Constant_13_output_0", "/blocks.0/self_attn/Slice_1_output_0", "/blocks.0/self_attn/Neg_output_0", "/blocks.0/self_attn/Unsqueeze_6_output_0", "/blocks.0/self_attn/Slice_output_0", "/blocks.0/self_attn/Concat_3_output_0", "Unsqueeze158", "Unsqueeze161", "StridedSlice164", "Squeeze165", "BinaryOp166", "BinaryOp167", "/blocks.0/self_attn/Gather_3_output_0", "/blocks.0/self_attn/Mul_1_output_0", "/blocks.0/self_attn/Add_output_0", "/blocks.0/self_attn/k_proj/FakeLinear_output_0", "/blocks.0/self_attn/Unsqueeze_2_output_0", "/blocks.0/self_attn/Unsqueeze_3_output_0", "/blocks.0/self_attn/Constant_6_output_0", "/blocks.0/self_attn/Concat_1_output_0", "/blocks.0/self_attn/Reshape_1_output_0", "/blocks.0/self_attn/Mul_2_output_0", "/blocks.0/self_attn/Shape_3_output_0", "Shape126", "Rank128", "BinaryOp130", "Unsqueeze131", "BinaryOp133", "Unsqueeze134", "StridedSlice137", "Squeeze138", "BinaryOp139", "BinaryOp140", "/blocks.0/self_attn/Gather_5_output_0", "/blocks.0/self_attn/Div_1_output_0", "/blocks.0/self_attn/Unsqueeze_9_output_0", "/blocks.0/self_attn/Slice_3_output_0", "/blocks.0/self_attn/Neg_1_output_0", "/blocks.0/self_attn/Unsqueeze_8_output_0", "/blocks.0/self_attn/Slice_2_output_0", "/blocks.0/self_attn/Concat_4_output_0", "/blocks.0/self_attn/Mul_3_output_0", "/blocks.0/self_attn/Add_1_output_0", "/blocks.0/self_attn/v_proj/FakeLinear_output_0", "/blocks.0/self_attn/Unsqueeze_4_output_0", "/blocks.0/self_attn/Unsqueeze_5_output_0", "/blocks.0/self_attn/Concat_2_output_0", "/blocks.0/self_attn/Reshape_2_output_0", "attention_mask", "/blocks.0/self_attn/Reshape_7_output_0", "/blocks.0/self_attn/o_proj/FakeLinear_output_0", "/blocks.0/Add_output_0", "/blocks.0/post_attention_layernorm/Mul_1_output_0", "/blocks.0/mlp/gate_proj/FakeLinear_output_0", "/blocks.0/mlp/act_fn/Mul_output_0", "/blocks.0/mlp/up_proj/FakeLinear_output_0", "/blocks.0/mlp/Mul_output_0", "/blocks.0/mlp/down_proj/FakeLinear_output_0", "/blocks.0/Add_1_output_0", "/blocks.1/Reshape_output_0", "/blocks.1/input_layernorm/Mul_1_output_0", "/blocks.1/self_attn/q_proj/FakeLinear_output_0", "/blocks.1/self_attn/Shape_output_0", "Shape484", "Rank486", "BinaryOp488", "Unsqueeze489", "BinaryOp491", "Unsqueeze492", "StridedSlice495", "Squeeze496", "BinaryOp498", "/blocks.1/self_attn/Gather_output_0", "/blocks.1/self_attn/Unsqueeze_output_0", "Unsqueeze506", "Unsqueeze509", "StridedSlice512", "Squeeze513", "BinaryOp514", "BinaryOp515", "/blocks.1/self_attn/Gather_1_output_0", "/blocks.1/self_attn/Unsqueeze_1_output_0", "/blocks.1/self_attn/Concat_output_0", "/blocks.1/self_attn/Reshape_output_0", "/blocks.1/self_attn/Mul_output_0", "/blocks.1/self_attn/Shape_2_output_0", "Shape615", "Rank617", "BinaryOp619", "Unsqueeze620", "BinaryOp622", "Unsqueeze623", "StridedSlice626", "Squeeze627", "BinaryOp628", "BinaryOp629", "/blocks.1/self_attn/Gather_2_output_0", "/blocks.1/self_attn/Div_output_0", "/blocks.1/self_attn/Unsqueeze_7_output_0", "/blocks.1/self_attn/Slice_1_output_0", "/blocks.1/self_attn/Neg_output_0", "/blocks.1/self_attn/Unsqueeze_6_output_0", "/blocks.1/self_attn/Slice_output_0", "/blocks.1/self_attn/Concat_3_output_0", "/blocks.1/self_attn/Mul_1_output_0", "/blocks.1/self_attn/Add_output_0", "/blocks.1/self_attn/k_proj/FakeLinear_output_0", "/blocks.1/self_attn/Unsqueeze_2_output_0", "/blocks.1/self_attn/Unsqueeze_3_output_0", "/blocks.1/self_attn/Concat_1_output_0", "/blocks.1/self_attn/Reshape_1_output_0", "/blocks.1/self_attn/Mul_2_output_0", "/blocks.1/self_attn/Shape_3_output_0", "Shape522", "Rank524", "BinaryOp526", "Unsqueeze527", "BinaryOp529", "Unsqueeze530", "StridedSlice533", "Squeeze534", "BinaryOp535", "BinaryOp536", "/blocks.1/self_attn/Gather_3_output_0", "/blocks.1/self_attn/Div_1_output_0", "/blocks.1/self_attn/Unsqueeze_9_output_0", "/blocks.1/self_attn/Slice_3_output_0", "/blocks.1/self_attn/Neg_1_output_0", "/blocks.1/self_attn/Unsqueeze_8_output_0", "/blocks.1/self_attn/Slice_2_output_0", "/blocks.1/self_attn/Concat_4_output_0", "/blocks.1/self_attn/Mul_3_output_0", "/blocks.1/self_attn/Add_1_output_0", "/blocks.1/self_attn/v_proj/FakeLinear_output_0", "/blocks.1/self_attn/Unsqueeze_4_output_0", "/blocks.1/self_attn/Unsqueeze_5_output_0", "/blocks.1/self_attn/Concat_2_output_0", "/blocks.1/self_attn/Reshape_2_output_0", "/blocks.1/self_attn/Reshape_7_output_0", "/blocks.1/self_attn/o_proj/FakeLinear_output_0", "/blocks.1/Add_output_0", "/blocks.1/post_attention_layernorm/Mul_1_output_0", "/blocks.1/mlp/gate_proj/FakeLinear_output_0", "/blocks.1/mlp/act_fn/Mul_output_0", "/blocks.1/mlp/up_proj/FakeLinear_output_0", "/blocks.1/mlp/Mul_output_0", "/blocks.1/mlp/down_proj/FakeLinear_output_0", "/blocks.1/Add_1_output_0", "/blocks.2/Reshape_output_0", "/blocks.2/input_layernorm/Mul_1_output_0", "/blocks.2/self_attn/q_proj/FakeLinear_output_0", "/blocks.2/self_attn/Shape_output_0", "Shape854", "Rank856", "BinaryOp858", "Unsqueeze859", "BinaryOp861", "Unsqueeze862", "StridedSlice865", "Squeeze866", "BinaryOp868", "/blocks.2/self_attn/Gather_output_0", "/blocks.2/self_attn/Unsqueeze_output_0", "Unsqueeze876", "Unsqueeze879", "StridedSlice882", "Squeeze883", "BinaryOp884", "BinaryOp885", "/blocks.2/self_attn/Gather_1_output_0", "/blocks.2/self_attn/Unsqueeze_1_output_0", "/blocks.2/self_attn/Concat_output_0", "/blocks.2/self_attn/Reshape_output_0", "/blocks.2/self_attn/Mul_output_0", "/blocks.2/self_attn/Shape_2_output_0", "Shape985", "Rank987", "BinaryOp989", "Unsqueeze990", "BinaryOp992", "Unsqueeze993", "StridedSlice996", "Squeeze997", "BinaryOp998", "BinaryOp999", "/blocks.2/self_attn/Gather_2_output_0", "/blocks.2/self_attn/Div_output_0", "/blocks.2/self_attn/Unsqueeze_7_output_0", "/blocks.2/self_attn/Slice_1_output_0", "/blocks.2/self_attn/Neg_output_0", "/blocks.2/self_attn/Unsqueeze_6_output_0", "/blocks.2/self_attn/Slice_output_0", "/blocks.2/self_attn/Concat_3_output_0", "/blocks.2/self_attn/Mul_1_output_0", "/blocks.2/self_attn/Add_output_0", "/blocks.2/self_attn/k_proj/FakeLinear_output_0", "/blocks.2/self_attn/Unsqueeze_2_output_0", "/blocks.2/self_attn/Unsqueeze_3_output_0", "/blocks.2/self_attn/Concat_1_output_0", "/blocks.2/self_attn/Reshape_1_output_0", "/blocks.2/self_attn/Mul_2_output_0", "/blocks.2/self_attn/Shape_3_output_0", "Shape892", "Rank894", "BinaryOp896", "Unsqueeze897", "BinaryOp899", "Unsqueeze900", "StridedSlice903", "Squeeze904", "BinaryOp905", "BinaryOp906", "/blocks.2/self_attn/Gather_3_output_0", "/blocks.2/self_attn/Div_1_output_0", "/blocks.2/self_attn/Unsqueeze_9_output_0", "/blocks.2/self_attn/Slice_3_output_0", "/blocks.2/self_attn/Neg_1_output_0", "/blocks.2/self_attn/Unsqueeze_8_output_0", "/blocks.2/self_attn/Slice_2_output_0", "/blocks.2/self_attn/Concat_4_output_0", "/blocks.2/self_attn/Mul_3_output_0", "/blocks.2/self_attn/Add_1_output_0", "/blocks.2/self_attn/v_proj/FakeLinear_output_0", "/blocks.2/self_attn/Unsqueeze_4_output_0", "/blocks.2/self_attn/Unsqueeze_5_output_0", "/blocks.2/self_attn/Concat_2_output_0", "/blocks.2/self_attn/Reshape_2_output_0", "/blocks.2/self_attn/Reshape_7_output_0", "/blocks.2/self_attn/o_proj/FakeLinear_output_0", "/blocks.2/Add_output_0", "/blocks.2/post_attention_layernorm/Mul_1_output_0", "/blocks.2/mlp/gate_proj/FakeLinear_output_0", "/blocks.2/mlp/act_fn/Mul_output_0", "/blocks.2/mlp/up_proj/FakeLinear_output_0", "/blocks.2/mlp/Mul_output_0", "/blocks.2/mlp/down_proj/FakeLinear_output_0", "/blocks.2/Add_1_output_0", "/blocks.3/Reshape_output_0", "/blocks.3/input_layernorm/Mul_1_output_0", "/blocks.3/self_attn/q_proj/FakeLinear_output_0", "/blocks.3/self_attn/Shape_output_0", "Shape1224", "Rank1226", "BinaryOp1228", "Unsqueeze1229", "BinaryOp1231", "Unsqueeze1232", "StridedSlice1235", "Squeeze1236", "BinaryOp1238", "/blocks.3/self_attn/Gather_output_0", "/blocks.3/self_attn/Unsqueeze_output_0", "Unsqueeze1246", "Unsqueeze1249", "StridedSlice1252", "Squeeze1253", "BinaryOp1254", "BinaryOp1255", "/blocks.3/self_attn/Gather_1_output_0", "/blocks.3/self_attn/Unsqueeze_1_output_0", "/blocks.3/self_attn/Concat_output_0", "/blocks.3/self_attn/Reshape_output_0", "/blocks.3/self_attn/Mul_output_0", "/blocks.3/self_attn/Shape_2_output_0", "Shape1356", "Rank1358", "BinaryOp1360", "Unsqueeze1361", "BinaryOp1363", "Unsqueeze1364", "StridedSlice1367", "Squeeze1368", "BinaryOp1369", "BinaryOp1370", "/blocks.3/self_attn/Gather_2_output_0", "/blocks.3/self_attn/Div_output_0", "/blocks.3/self_attn/Unsqueeze_7_output_0", "/blocks.3/self_attn/Slice_1_output_0", "/blocks.3/self_attn/Neg_output_0", "/blocks.3/self_attn/Unsqueeze_6_output_0", "/blocks.3/self_attn/Slice_output_0", "/blocks.3/self_attn/Concat_3_output_0", "/blocks.3/self_attn/Mul_1_output_0", "/blocks.3/self_attn/Add_output_0", "/blocks.3/self_attn/k_proj/FakeLinear_output_0", "/blocks.3/self_attn/Unsqueeze_2_output_0", "/blocks.3/self_attn/Unsqueeze_3_output_0", "/blocks.3/self_attn/Concat_1_output_0", "/blocks.3/self_attn/Reshape_1_output_0", "/blocks.3/self_attn/Mul_2_output_0", "/blocks.3/self_attn/Shape_3_output_0", "Shape1262", "Rank1264", "BinaryOp1266", "Unsqueeze1267", "BinaryOp1269", "Unsqueeze1270", "StridedSlice1273", "Squeeze1274", "BinaryOp1275", "BinaryOp1276", "/blocks.3/self_attn/Gather_3_output_0", "/blocks.3/self_attn/Div_1_output_0", "/blocks.3/self_attn/Unsqueeze_9_output_0", "/blocks.3/self_attn/Slice_3_output_0", "/blocks.3/self_attn/Neg_1_output_0", "/blocks.3/self_attn/Unsqueeze_8_output_0", "/blocks.3/self_attn/Slice_2_output_0", "/blocks.3/self_attn/Concat_4_output_0", "/blocks.3/self_attn/Mul_3_output_0", "/blocks.3/self_attn/Add_1_output_0", "/blocks.3/self_attn/v_proj/FakeLinear_output_0", "/blocks.3/self_attn/Unsqueeze_4_output_0", "/blocks.3/self_attn/Unsqueeze_5_output_0", "/blocks.3/self_attn/Concat_2_output_0", "/blocks.3/self_attn/Reshape_2_output_0", "/blocks.3/self_attn/Reshape_7_output_0", "/blocks.3/self_attn/o_proj/FakeLinear_output_0", "/blocks.3/Add_output_0", "/blocks.3/post_attention_layernorm/Mul_1_output_0", "/blocks.3/mlp/gate_proj/FakeLinear_output_0", "/blocks.3/mlp/act_fn/Mul_output_0", "/blocks.3/mlp/up_proj/FakeLinear_output_0", "/blocks.3/mlp/Mul_output_0", "/blocks.3/mlp/down_proj/FakeLinear_output_0", "/blocks.3/Add_1_output_0", "/blocks.4/Reshape_output_0", "/blocks.4/input_layernorm/Mul_1_output_0", "/blocks.4/self_attn/q_proj/FakeLinear_output_0", "/blocks.4/self_attn/Shape_output_0", "Shape1595", "Rank1597", "BinaryOp1599", "Unsqueeze1600", "BinaryOp1602", "Unsqueeze1603", "StridedSlice1606", "Squeeze1607", "BinaryOp1609", "/blocks.4/self_attn/Gather_output_0", "/blocks.4/self_attn/Unsqueeze_output_0", "Unsqueeze1617", "Unsqueeze1620", "StridedSlice1623", "Squeeze1624", "BinaryOp1625", "BinaryOp1626", "/blocks.4/self_attn/Gather_1_output_0", "/blocks.4/self_attn/Unsqueeze_1_output_0", "/blocks.4/self_attn/Concat_output_0", "/blocks.4/self_attn/Reshape_output_0", "/blocks.4/self_attn/Mul_output_0", "/blocks.4/self_attn/Shape_2_output_0", "Shape1726", "Rank1728", "BinaryOp1730", "Unsqueeze1731", "BinaryOp1733", "Unsqueeze1734", "StridedSlice1737", "Squeeze1738", "BinaryOp1739", "BinaryOp1740", "/blocks.4/self_attn/Gather_2_output_0", "/blocks.4/self_attn/Div_output_0", "/blocks.4/self_attn/Unsqueeze_7_output_0", "/blocks.4/self_attn/Slice_1_output_0", "/blocks.4/self_attn/Neg_output_0", "/blocks.4/self_attn/Unsqueeze_6_output_0", "/blocks.4/self_attn/Slice_output_0", "/blocks.4/self_attn/Concat_3_output_0", "/blocks.4/self_attn/Mul_1_output_0", "/blocks.4/self_attn/Add_output_0", "/blocks.4/self_attn/k_proj/FakeLinear_output_0", "/blocks.4/self_attn/Unsqueeze_2_output_0", "/blocks.4/self_attn/Unsqueeze_3_output_0", "/blocks.4/self_attn/Concat_1_output_0", "/blocks.4/self_attn/Reshape_1_output_0", "/blocks.4/self_attn/Mul_2_output_0", "/blocks.4/self_attn/Shape_3_output_0", "Shape1633", "Rank1635", "BinaryOp1637", "Unsqueeze1638", "BinaryOp1640", "Unsqueeze1641", "StridedSlice1644", "Squeeze1645", "BinaryOp1646", "BinaryOp1647", "/blocks.4/self_attn/Gather_3_output_0", "/blocks.4/self_attn/Div_1_output_0", "/blocks.4/self_attn/Unsqueeze_9_output_0", "/blocks.4/self_attn/Slice_3_output_0", "/blocks.4/self_attn/Neg_1_output_0", "/blocks.4/self_attn/Unsqueeze_8_output_0", "/blocks.4/self_attn/Slice_2_output_0", "/blocks.4/self_attn/Concat_4_output_0", "/blocks.4/self_attn/Mul_3_output_0", "/blocks.4/self_attn/Add_1_output_0", "/blocks.4/self_attn/v_proj/FakeLinear_output_0", "/blocks.4/self_attn/Unsqueeze_4_output_0", "/blocks.4/self_attn/Unsqueeze_5_output_0", "/blocks.4/self_attn/Concat_2_output_0", "/blocks.4/self_attn/Reshape_2_output_0", "/blocks.4/self_attn/Reshape_7_output_0", "/blocks.4/self_attn/o_proj/FakeLinear_output_0", "/blocks.4/Add_output_0", "/blocks.4/post_attention_layernorm/Mul_1_output_0", "/blocks.4/mlp/gate_proj/FakeLinear_output_0", "/blocks.4/mlp/act_fn/Mul_output_0", "/blocks.4/mlp/up_proj/FakeLinear_output_0", "/blocks.4/mlp/Mul_output_0", "/blocks.4/mlp/down_proj/FakeLinear_output_0", "/blocks.4/Add_1_output_0", "/blocks.5/Reshape_output_0", "/blocks.5/input_layernorm/Mul_1_output_0", "/blocks.5/self_attn/q_proj/FakeLinear_output_0", "/blocks.5/self_attn/Shape_output_0", "Shape1965", "Rank1967", "BinaryOp1969", "Unsqueeze1970", "BinaryOp1972", "Unsqueeze1973", "StridedSlice1976", "Squeeze1977", "BinaryOp1979", "/blocks.5/self_attn/Gather_output_0", "/blocks.5/self_attn/Unsqueeze_output_0", "Unsqueeze1987", "Unsqueeze1990", "StridedSlice1993", "Squeeze1994", "BinaryOp1995", "BinaryOp1996", "/blocks.5/self_attn/Gather_1_output_0", "/blocks.5/self_attn/Unsqueeze_1_output_0", "/blocks.5/self_attn/Concat_output_0", "/blocks.5/self_attn/Reshape_output_0", "/blocks.5/self_attn/Mul_output_0", "/blocks.5/self_attn/Shape_2_output_0", "Shape2097", "Rank2099", "BinaryOp2101", "Unsqueeze2102", "BinaryOp2104", "Unsqueeze2105", "StridedSlice2108", "Squeeze2109", "BinaryOp2110", "BinaryOp2111", "/blocks.5/self_attn/Gather_2_output_0", "/blocks.5/self_attn/Div_output_0", "/blocks.5/self_attn/Unsqueeze_7_output_0", "/blocks.5/self_attn/Slice_1_output_0", "/blocks.5/self_attn/Neg_output_0", "/blocks.5/self_attn/Unsqueeze_6_output_0", "/blocks.5/self_attn/Slice_output_0", "/blocks.5/self_attn/Concat_3_output_0", "/blocks.5/self_attn/Mul_1_output_0", "/blocks.5/self_attn/Add_output_0", "/blocks.5/self_attn/k_proj/FakeLinear_output_0", "/blocks.5/self_attn/Unsqueeze_2_output_0", "/blocks.5/self_attn/Unsqueeze_3_output_0", "/blocks.5/self_attn/Concat_1_output_0", "/blocks.5/self_attn/Reshape_1_output_0", "/blocks.5/self_attn/Mul_2_output_0", "/blocks.5/self_attn/Shape_3_output_0", "Shape2003", "Rank2005", "BinaryOp2007", "Unsqueeze2008", "BinaryOp2010", "Unsqueeze2011", "StridedSlice2014", "Squeeze2015", "BinaryOp2016", "BinaryOp2017", "/blocks.5/self_attn/Gather_3_output_0", "/blocks.5/self_attn/Div_1_output_0", "/blocks.5/self_attn/Unsqueeze_9_output_0", "/blocks.5/self_attn/Slice_3_output_0", "/blocks.5/self_attn/Neg_1_output_0", "/blocks.5/self_attn/Unsqueeze_8_output_0", "/blocks.5/self_attn/Slice_2_output_0", "/blocks.5/self_attn/Concat_4_output_0", "/blocks.5/self_attn/Mul_3_output_0", "/blocks.5/self_attn/Add_1_output_0", "/blocks.5/self_attn/v_proj/FakeLinear_output_0", "/blocks.5/self_attn/Unsqueeze_4_output_0", "/blocks.5/self_attn/Unsqueeze_5_output_0", "/blocks.5/self_attn/Concat_2_output_0", "/blocks.5/self_attn/Reshape_2_output_0", "/blocks.5/self_attn/Reshape_7_output_0", "/blocks.5/self_attn/o_proj/FakeLinear_output_0", "/blocks.5/Add_output_0", "/blocks.5/post_attention_layernorm/Mul_1_output_0", "/blocks.5/mlp/gate_proj/FakeLinear_output_0", "/blocks.5/mlp/act_fn/Mul_output_0", "/blocks.5/mlp/up_proj/FakeLinear_output_0", "/blocks.5/mlp/Mul_output_0", "/blocks.5/mlp/down_proj/FakeLinear_output_0", "/blocks.5/Add_1_output_0", "/blocks.6/Reshape_output_0", "/blocks.6/input_layernorm/Mul_1_output_0", "/blocks.6/self_attn/q_proj/FakeLinear_output_0", "/blocks.6/self_attn/Shape_output_0", "Shape2336", "Rank2338", "BinaryOp2340", "Unsqueeze2341", "BinaryOp2343", "Unsqueeze2344", "StridedSlice2347", "Squeeze2348", "BinaryOp2350", "/blocks.6/self_attn/Gather_output_0", "/blocks.6/self_attn/Unsqueeze_output_0", "Unsqueeze2358", "Unsqueeze2361", "StridedSlice2364", "Squeeze2365", "BinaryOp2366", "BinaryOp2367", "/blocks.6/self_attn/Gather_1_output_0", "/blocks.6/self_attn/Unsqueeze_1_output_0", "/blocks.6/self_attn/Concat_output_0", "/blocks.6/self_attn/Reshape_output_0", "/blocks.6/self_attn/Mul_output_0", "/blocks.6/self_attn/Shape_2_output_0", "Shape2468", "Rank2470", "BinaryOp2472", "Unsqueeze2473", "BinaryOp2475", "Unsqueeze2476", "StridedSlice2479", "Squeeze2480", "BinaryOp2481", "BinaryOp2482", "/blocks.6/self_attn/Gather_2_output_0", "/blocks.6/self_attn/Div_output_0", "/blocks.6/self_attn/Unsqueeze_7_output_0", "/blocks.6/self_attn/Slice_1_output_0", "/blocks.6/self_attn/Neg_output_0", "/blocks.6/self_attn/Unsqueeze_6_output_0", "/blocks.6/self_attn/Slice_output_0", "/blocks.6/self_attn/Concat_3_output_0", "/blocks.6/self_attn/Mul_1_output_0", "/blocks.6/self_attn/Add_output_0", "/blocks.6/self_attn/k_proj/FakeLinear_output_0", "/blocks.6/self_attn/Unsqueeze_2_output_0", "/blocks.6/self_attn/Unsqueeze_3_output_0", "/blocks.6/self_attn/Concat_1_output_0", "/blocks.6/self_attn/Reshape_1_output_0", "/blocks.6/self_attn/Mul_2_output_0", "/blocks.6/self_attn/Shape_3_output_0", "Shape2374", "Rank2376", "BinaryOp2378", "Unsqueeze2379", "BinaryOp2381", "Unsqueeze2382", "StridedSlice2385", "Squeeze2386", "BinaryOp2387", "BinaryOp2388", "/blocks.6/self_attn/Gather_3_output_0", "/blocks.6/self_attn/Div_1_output_0", "/blocks.6/self_attn/Unsqueeze_9_output_0", "/blocks.6/self_attn/Slice_3_output_0", "/blocks.6/self_attn/Neg_1_output_0", "/blocks.6/self_attn/Unsqueeze_8_output_0", "/blocks.6/self_attn/Slice_2_output_0", "/blocks.6/self_attn/Concat_4_output_0", "/blocks.6/self_attn/Mul_3_output_0", "/blocks.6/self_attn/Add_1_output_0", "/blocks.6/self_attn/v_proj/FakeLinear_output_0", "/blocks.6/self_attn/Unsqueeze_4_output_0", "/blocks.6/self_attn/Unsqueeze_5_output_0", "/blocks.6/self_attn/Concat_2_output_0", "/blocks.6/self_attn/Reshape_2_output_0", "/blocks.6/self_attn/Reshape_7_output_0", "/blocks.6/self_attn/o_proj/FakeLinear_output_0", "/blocks.6/Add_output_0", "/blocks.6/post_attention_layernorm/Mul_1_output_0", "/blocks.6/mlp/gate_proj/FakeLinear_output_0", "/blocks.6/mlp/act_fn/Mul_output_0", "/blocks.6/mlp/up_proj/FakeLinear_output_0", "/blocks.6/mlp/Mul_output_0", "/blocks.6/mlp/down_proj/FakeLinear_output_0", "/blocks.6/Add_1_output_0", "/blocks.7/Reshape_output_0", "/blocks.7/input_layernorm/Mul_1_output_0", "/blocks.7/self_attn/q_proj/FakeLinear_output_0", "/blocks.7/self_attn/Shape_output_0", "Shape2707", "Rank2709", "BinaryOp2711", "Unsqueeze2712", "BinaryOp2714", "Unsqueeze2715", "StridedSlice2718", "Squeeze2719", "BinaryOp2721", "/blocks.7/self_attn/Gather_output_0", "/blocks.7/self_attn/Unsqueeze_output_0", "Unsqueeze2729", "Unsqueeze2732", "StridedSlice2735", "Squeeze2736", "BinaryOp2737", "BinaryOp2738", "/blocks.7/self_attn/Gather_1_output_0", "/blocks.7/self_attn/Unsqueeze_1_output_0", "/blocks.7/self_attn/Concat_output_0", "/blocks.7/self_attn/Reshape_output_0", "/blocks.7/self_attn/Mul_output_0", "/blocks.7/self_attn/Shape_2_output_0", "Shape2839", "Rank2841", "BinaryOp2843", "Unsqueeze2844", "BinaryOp2846", "Unsqueeze2847", "StridedSlice2850", "Squeeze2851", "BinaryOp2852", "BinaryOp2853", "/blocks.7/self_attn/Gather_2_output_0", "/blocks.7/self_attn/Div_output_0", "/blocks.7/self_attn/Unsqueeze_7_output_0", "/blocks.7/self_attn/Slice_1_output_0", "/blocks.7/self_attn/Neg_output_0", "/blocks.7/self_attn/Unsqueeze_6_output_0", "/blocks.7/self_attn/Slice_output_0", "/blocks.7/self_attn/Concat_3_output_0", "/blocks.7/self_attn/Mul_1_output_0", "/blocks.7/self_attn/Add_output_0", "/blocks.7/self_attn/k_proj/FakeLinear_output_0", "/blocks.7/self_attn/Unsqueeze_2_output_0", "/blocks.7/self_attn/Unsqueeze_3_output_0", "/blocks.7/self_attn/Concat_1_output_0", "/blocks.7/self_attn/Reshape_1_output_0", "/blocks.7/self_attn/Mul_2_output_0", "/blocks.7/self_attn/Shape_3_output_0", "Shape2745", "Rank2747", "BinaryOp2749", "Unsqueeze2750", "BinaryOp2752", "Unsqueeze2753", "StridedSlice2756", "Squeeze2757", "BinaryOp2758", "BinaryOp2759", "/blocks.7/self_attn/Gather_3_output_0", "/blocks.7/self_attn/Div_1_output_0", "/blocks.7/self_attn/Unsqueeze_9_output_0", "/blocks.7/self_attn/Slice_3_output_0", "/blocks.7/self_attn/Neg_1_output_0", "/blocks.7/self_attn/Unsqueeze_8_output_0", "/blocks.7/self_attn/Slice_2_output_0", "/blocks.7/self_attn/Concat_4_output_0", "/blocks.7/self_attn/Mul_3_output_0", "/blocks.7/self_attn/Add_1_output_0", "/blocks.7/self_attn/v_proj/FakeLinear_output_0", "/blocks.7/self_attn/Unsqueeze_4_output_0", "/blocks.7/self_attn/Unsqueeze_5_output_0", "/blocks.7/self_attn/Concat_2_output_0", "/blocks.7/self_attn/Reshape_2_output_0", "/blocks.7/self_attn/Reshape_7_output_0", "/blocks.7/self_attn/o_proj/FakeLinear_output_0", "/blocks.7/Add_output_0", "/blocks.7/post_attention_layernorm/Mul_1_output_0", "/blocks.7/mlp/gate_proj/FakeLinear_output_0", "/blocks.7/mlp/act_fn/Mul_output_0", "/blocks.7/mlp/up_proj/FakeLinear_output_0", "/blocks.7/mlp/Mul_output_0", "/blocks.7/mlp/down_proj/FakeLinear_output_0", "/blocks.7/Add_1_output_0", "/blocks.8/Reshape_output_0", "/blocks.8/input_layernorm/Mul_1_output_0", "/blocks.8/self_attn/q_proj/FakeLinear_output_0", "/blocks.8/self_attn/Shape_output_0", "Shape3078", "Rank3080", "BinaryOp3082", "Unsqueeze3083", "BinaryOp3085", "Unsqueeze3086", "StridedSlice3089", "Squeeze3090", "BinaryOp3092", "/blocks.8/self_attn/Gather_output_0", "/blocks.8/self_attn/Unsqueeze_output_0", "Unsqueeze3100", "Unsqueeze3103", "StridedSlice3106", "Squeeze3107", "BinaryOp3108", "BinaryOp3109", "/blocks.8/self_attn/Gather_1_output_0", "/blocks.8/self_attn/Unsqueeze_1_output_0", "/blocks.8/self_attn/Concat_output_0", "/blocks.8/self_attn/Reshape_output_0", "/blocks.8/self_attn/Mul_output_0", "/blocks.8/self_attn/Shape_2_output_0", "Shape3210", "Rank3212", "BinaryOp3214", "Unsqueeze3215", "BinaryOp3217", "Unsqueeze3218", "StridedSlice3221", "Squeeze3222", "BinaryOp3223", "BinaryOp3224", "/blocks.8/self_attn/Gather_2_output_0", "/blocks.8/self_attn/Div_output_0", "/blocks.8/self_attn/Unsqueeze_7_output_0", "/blocks.8/self_attn/Slice_1_output_0", "/blocks.8/self_attn/Neg_output_0", "/blocks.8/self_attn/Unsqueeze_6_output_0", "/blocks.8/self_attn/Slice_output_0", "/blocks.8/self_attn/Concat_3_output_0", "/blocks.8/self_attn/Mul_1_output_0", "/blocks.8/self_attn/Add_output_0", "/blocks.8/self_attn/k_proj/FakeLinear_output_0", "/blocks.8/self_attn/Unsqueeze_2_output_0", "/blocks.8/self_attn/Unsqueeze_3_output_0", "/blocks.8/self_attn/Concat_1_output_0", "/blocks.8/self_attn/Reshape_1_output_0", "/blocks.8/self_attn/Mul_2_output_0", "/blocks.8/self_attn/Shape_3_output_0", "Shape3116", "Rank3118", "BinaryOp3120", "Unsqueeze3121", "BinaryOp3123", "Unsqueeze3124", "StridedSlice3127", "Squeeze3128", "BinaryOp3129", "BinaryOp3130", "/blocks.8/self_attn/Gather_3_output_0", "/blocks.8/self_attn/Div_1_output_0", "/blocks.8/self_attn/Unsqueeze_9_output_0", "/blocks.8/self_attn/Slice_3_output_0", "/blocks.8/self_attn/Neg_1_output_0", "/blocks.8/self_attn/Unsqueeze_8_output_0", "/blocks.8/self_attn/Slice_2_output_0", "/blocks.8/self_attn/Concat_4_output_0", "/blocks.8/self_attn/Mul_3_output_0", "/blocks.8/self_attn/Add_1_output_0", "/blocks.8/self_attn/v_proj/FakeLinear_output_0", "/blocks.8/self_attn/Unsqueeze_4_output_0", "/blocks.8/self_attn/Unsqueeze_5_output_0", "/blocks.8/self_attn/Concat_2_output_0", "/blocks.8/self_attn/Reshape_2_output_0", "/blocks.8/self_attn/Reshape_7_output_0", "/blocks.8/self_attn/o_proj/FakeLinear_output_0", "/blocks.8/Add_output_0", "/blocks.8/post_attention_layernorm/Mul_1_output_0", "/blocks.8/mlp/gate_proj/FakeLinear_output_0", "/blocks.8/mlp/act_fn/Mul_output_0", "/blocks.8/mlp/up_proj/FakeLinear_output_0", "/blocks.8/mlp/Mul_output_0", "/blocks.8/mlp/down_proj/FakeLinear_output_0", "/blocks.8/Add_1_output_0", "/blocks.9/Reshape_output_0", "/blocks.9/input_layernorm/Mul_1_output_0", "/blocks.9/self_attn/q_proj/FakeLinear_output_0", "/blocks.9/self_attn/Shape_output_0", "Shape3449", "Rank3451", "BinaryOp3453", "Unsqueeze3454", "BinaryOp3456", "Unsqueeze3457", "StridedSlice3460", "Squeeze3461", "BinaryOp3463", "/blocks.9/self_attn/Gather_output_0", "/blocks.9/self_attn/Unsqueeze_output_0", "Unsqueeze3471", "Unsqueeze3474", "StridedSlice3477", "Squeeze3478", "BinaryOp3479", "BinaryOp3480", "/blocks.9/self_attn/Gather_1_output_0", "/blocks.9/self_attn/Unsqueeze_1_output_0", "/blocks.9/self_attn/Concat_output_0", "/blocks.9/self_attn/Reshape_output_0", "/blocks.9/self_attn/Mul_output_0", "/blocks.9/self_attn/Shape_2_output_0", "Shape3581", "Rank3583", "BinaryOp3585", "Unsqueeze3586", "BinaryOp3588", "Unsqueeze3589", "StridedSlice3592", "Squeeze3593", "BinaryOp3594", "BinaryOp3595", "/blocks.9/self_attn/Gather_2_output_0", "/blocks.9/self_attn/Div_output_0", "/blocks.9/self_attn/Unsqueeze_7_output_0", "/blocks.9/self_attn/Slice_1_output_0", "/blocks.9/self_attn/Neg_output_0", "/blocks.9/self_attn/Unsqueeze_6_output_0", "/blocks.9/self_attn/Slice_output_0", "/blocks.9/self_attn/Concat_3_output_0", "/blocks.9/self_attn/Mul_1_output_0", "/blocks.9/self_attn/Add_output_0", "/blocks.9/self_attn/k_proj/FakeLinear_output_0", "/blocks.9/self_attn/Unsqueeze_2_output_0", "/blocks.9/self_attn/Unsqueeze_3_output_0", "/blocks.9/self_attn/Concat_1_output_0", "/blocks.9/self_attn/Reshape_1_output_0", "/blocks.9/self_attn/Mul_2_output_0", "/blocks.9/self_attn/Shape_3_output_0", "Shape3487", "Rank3489", "BinaryOp3491", "Unsqueeze3492", "BinaryOp3494", "Unsqueeze3495", "StridedSlice3498", "Squeeze3499", "BinaryOp3500", "BinaryOp3501", "/blocks.9/self_attn/Gather_3_output_0", "/blocks.9/self_attn/Div_1_output_0", "/blocks.9/self_attn/Unsqueeze_9_output_0", "/blocks.9/self_attn/Slice_3_output_0", "/blocks.9/self_attn/Neg_1_output_0", "/blocks.9/self_attn/Unsqueeze_8_output_0", "/blocks.9/self_attn/Slice_2_output_0", "/blocks.9/self_attn/Concat_4_output_0", "/blocks.9/self_attn/Mul_3_output_0", "/blocks.9/self_attn/Add_1_output_0", "/blocks.9/self_attn/v_proj/FakeLinear_output_0", "/blocks.9/self_attn/Unsqueeze_4_output_0", "/blocks.9/self_attn/Unsqueeze_5_output_0", "/blocks.9/self_attn/Concat_2_output_0", "/blocks.9/self_attn/Reshape_2_output_0", "/blocks.9/self_attn/Reshape_7_output_0", "/blocks.9/self_attn/o_proj/FakeLinear_output_0", "/blocks.9/Add_output_0", "/blocks.9/post_attention_layernorm/Mul_1_output_0", "/blocks.9/mlp/gate_proj/FakeLinear_output_0", "/blocks.9/mlp/act_fn/Mul_output_0", "/blocks.9/mlp/up_proj/FakeLinear_output_0", "/blocks.9/mlp/Mul_output_0", "/blocks.9/mlp/down_proj/FakeLinear_output_0", "/blocks.9/Add_1_output_0", "/blocks.10/Reshape_output_0", "/blocks.10/input_layernorm/Mul_1_output_0", "/blocks.10/self_attn/q_proj/FakeLinear_output_0", "/blocks.10/self_attn/Shape_output_0", "Shape3820", "Rank3822", "BinaryOp3824", "Unsqueeze3825", "BinaryOp3827", "Unsqueeze3828", "StridedSlice3831", "Squeeze3832", "BinaryOp3834", "/blocks.10/self_attn/Gather_output_0", "/blocks.10/self_attn/Unsqueeze_output_0", "Unsqueeze3842", "Unsqueeze3845", "StridedSlice3848", "Squeeze3849", "BinaryOp3850", "BinaryOp3851", "/blocks.10/self_attn/Gather_1_output_0", "/blocks.10/self_attn/Unsqueeze_1_output_0", "/blocks.10/self_attn/Concat_output_0", "/blocks.10/self_attn/Reshape_output_0", "/blocks.10/self_attn/Mul_output_0", "/blocks.10/self_attn/Shape_2_output_0", "Shape3952", "Rank3954", "BinaryOp3956", "Unsqueeze3957", "BinaryOp3959", "Unsqueeze3960", "StridedSlice3963", "Squeeze3964", "BinaryOp3965", "BinaryOp3966", "/blocks.10/self_attn/Gather_2_output_0", "/blocks.10/self_attn/Div_output_0", "/blocks.10/self_attn/Unsqueeze_7_output_0", "/blocks.10/self_attn/Slice_1_output_0", "/blocks.10/self_attn/Neg_output_0", "/blocks.10/self_attn/Unsqueeze_6_output_0", "/blocks.10/self_attn/Slice_output_0", "/blocks.10/self_attn/Concat_3_output_0", "/blocks.10/self_attn/Mul_1_output_0", "/blocks.10/self_attn/Add_output_0", "/blocks.10/self_attn/k_proj/FakeLinear_output_0", "/blocks.10/self_attn/Unsqueeze_2_output_0", "/blocks.10/self_attn/Unsqueeze_3_output_0", "/blocks.10/self_attn/Concat_1_output_0", "/blocks.10/self_attn/Reshape_1_output_0", "/blocks.10/self_attn/Mul_2_output_0", "/blocks.10/self_attn/Shape_3_output_0", "Shape3858", "Rank3860", "BinaryOp3862", "Unsqueeze3863", "BinaryOp3865", "Unsqueeze3866", "StridedSlice3869", "Squeeze3870", "BinaryOp3871", "BinaryOp3872", "/blocks.10/self_attn/Gather_3_output_0", "/blocks.10/self_attn/Div_1_output_0", "/blocks.10/self_attn/Unsqueeze_9_output_0", "/blocks.10/self_attn/Slice_3_output_0", "/blocks.10/self_attn/Neg_1_output_0", "/blocks.10/self_attn/Unsqueeze_8_output_0", "/blocks.10/self_attn/Slice_2_output_0", "/blocks.10/self_attn/Concat_4_output_0", "/blocks.10/self_attn/Mul_3_output_0", "/blocks.10/self_attn/Add_1_output_0", "/blocks.10/self_attn/v_proj/FakeLinear_output_0", "/blocks.10/self_attn/Unsqueeze_4_output_0", "/blocks.10/self_attn/Unsqueeze_5_output_0", "/blocks.10/self_attn/Concat_2_output_0", "/blocks.10/self_attn/Reshape_2_output_0", "/blocks.10/self_attn/Reshape_7_output_0", "/blocks.10/self_attn/o_proj/FakeLinear_output_0", "/blocks.10/Add_output_0", "/blocks.10/post_attention_layernorm/Mul_1_output_0", "/blocks.10/mlp/gate_proj/FakeLinear_output_0", "/blocks.10/mlp/act_fn/Mul_output_0", "/blocks.10/mlp/up_proj/FakeLinear_output_0", "/blocks.10/mlp/Mul_output_0", "/blocks.10/mlp/down_proj/FakeLinear_output_0", "/blocks.10/Add_1_output_0", "/blocks.11/Reshape_output_0", "/blocks.11/input_layernorm/Mul_1_output_0", "/blocks.11/self_attn/q_proj/FakeLinear_output_0", "/blocks.11/self_attn/Shape_output_0", "Shape4191", "Rank4193", "BinaryOp4195", "Unsqueeze4196", "BinaryOp4198", "Unsqueeze4199", "StridedSlice4202", "Squeeze4203", "BinaryOp4205", "/blocks.11/self_attn/Gather_output_0", "/blocks.11/self_attn/Unsqueeze_output_0", "Unsqueeze4213", "Unsqueeze4216", "StridedSlice4219", "Squeeze4220", "BinaryOp4221", "BinaryOp4222", "/blocks.11/self_attn/Gather_1_output_0", "/blocks.11/self_attn/Unsqueeze_1_output_0", "/blocks.11/self_attn/Concat_output_0", "/blocks.11/self_attn/Reshape_output_0", "/blocks.11/self_attn/Mul_output_0", "/blocks.11/self_attn/Shape_2_output_0", "Shape4323", "Rank4325", "BinaryOp4327", "Unsqueeze4328", "BinaryOp4330", "Unsqueeze4331", "StridedSlice4334", "Squeeze4335", "BinaryOp4336", "BinaryOp4337", "/blocks.11/self_attn/Gather_2_output_0", "/blocks.11/self_attn/Div_output_0", "/blocks.11/self_attn/Unsqueeze_7_output_0", "/blocks.11/self_attn/Slice_1_output_0", "/blocks.11/self_attn/Neg_output_0", "/blocks.11/self_attn/Unsqueeze_6_output_0", "/blocks.11/self_attn/Slice_output_0", "/blocks.11/self_attn/Concat_3_output_0", "/blocks.11/self_attn/Mul_1_output_0", "/blocks.11/self_attn/Add_output_0", "/blocks.11/self_attn/k_proj/FakeLinear_output_0", "/blocks.11/self_attn/Unsqueeze_2_output_0", "/blocks.11/self_attn/Unsqueeze_3_output_0", "/blocks.11/self_attn/Concat_1_output_0", "/blocks.11/self_attn/Reshape_1_output_0", "/blocks.11/self_attn/Mul_2_output_0", "/blocks.11/self_attn/Shape_3_output_0", "Shape4229", "Rank4231", "BinaryOp4233", "Unsqueeze4234", "BinaryOp4236", "Unsqueeze4237", "StridedSlice4240", "Squeeze4241", "BinaryOp4242", "BinaryOp4243", "/blocks.11/self_attn/Gather_3_output_0", "/blocks.11/self_attn/Div_1_output_0", "/blocks.11/self_attn/Unsqueeze_9_output_0", "/blocks.11/self_attn/Slice_3_output_0", "/blocks.11/self_attn/Neg_1_output_0", "/blocks.11/self_attn/Unsqueeze_8_output_0", "/blocks.11/self_attn/Slice_2_output_0", "/blocks.11/self_attn/Concat_4_output_0", "/blocks.11/self_attn/Mul_3_output_0", "/blocks.11/self_attn/Add_1_output_0", "/blocks.11/self_attn/v_proj/FakeLinear_output_0", "/blocks.11/self_attn/Unsqueeze_4_output_0", "/blocks.11/self_attn/Unsqueeze_5_output_0", "/blocks.11/self_attn/Concat_2_output_0", "/blocks.11/self_attn/Reshape_2_output_0", "/blocks.11/self_attn/Reshape_7_output_0", "/blocks.11/self_attn/o_proj/FakeLinear_output_0", "/blocks.11/Add_output_0", "/blocks.11/post_attention_layernorm/Mul_1_output_0", "/blocks.11/mlp/gate_proj/FakeLinear_output_0", "/blocks.11/mlp/act_fn/Mul_output_0", "/blocks.11/mlp/up_proj/FakeLinear_output_0", "/blocks.11/mlp/Mul_output_0", "/blocks.11/mlp/down_proj/FakeLinear_output_0", "/blocks.11/Add_1_output_0", "/blocks.12/Reshape_output_0", "/blocks.12/input_layernorm/Mul_1_output_0", "/blocks.12/self_attn/q_proj/FakeLinear_output_0", "/blocks.12/self_attn/Shape_output_0", "Shape4562", "Rank4564", "BinaryOp4566", "Unsqueeze4567", "BinaryOp4569", "Unsqueeze4570", "StridedSlice4573", "Squeeze4574", "BinaryOp4576", "/blocks.12/self_attn/Gather_output_0", "/blocks.12/self_attn/Unsqueeze_output_0", "Unsqueeze4584", "Unsqueeze4587", "StridedSlice4590", "Squeeze4591", "BinaryOp4592", "BinaryOp4593", "/blocks.12/self_attn/Gather_1_output_0", "/blocks.12/self_attn/Unsqueeze_1_output_0", "/blocks.12/self_attn/Concat_output_0", "/blocks.12/self_attn/Reshape_output_0", "/blocks.12/self_attn/Mul_output_0", "/blocks.12/self_attn/Shape_2_output_0", "Shape4694", "Rank4696", "BinaryOp4698", "Unsqueeze4699", "BinaryOp4701", "Unsqueeze4702", "StridedSlice4705", "Squeeze4706", "BinaryOp4707", "BinaryOp4708", "/blocks.12/self_attn/Gather_2_output_0", "/blocks.12/self_attn/Div_output_0", "/blocks.12/self_attn/Unsqueeze_7_output_0", "/blocks.12/self_attn/Slice_1_output_0", "/blocks.12/self_attn/Neg_output_0", "/blocks.12/self_attn/Unsqueeze_6_output_0", "/blocks.12/self_attn/Slice_output_0", "/blocks.12/self_attn/Concat_3_output_0", "/blocks.12/self_attn/Mul_1_output_0", "/blocks.12/self_attn/Add_output_0", "/blocks.12/self_attn/k_proj/FakeLinear_output_0", "/blocks.12/self_attn/Unsqueeze_2_output_0", "/blocks.12/self_attn/Unsqueeze_3_output_0", "/blocks.12/self_attn/Concat_1_output_0", "/blocks.12/self_attn/Reshape_1_output_0", "/blocks.12/self_attn/Mul_2_output_0", "/blocks.12/self_attn/Shape_3_output_0", "Shape4600", "Rank4602", "BinaryOp4604", "Unsqueeze4605", "BinaryOp4607", "Unsqueeze4608", "StridedSlice4611", "Squeeze4612", "BinaryOp4613", "BinaryOp4614", "/blocks.12/self_attn/Gather_3_output_0", "/blocks.12/self_attn/Div_1_output_0", "/blocks.12/self_attn/Unsqueeze_9_output_0", "/blocks.12/self_attn/Slice_3_output_0", "/blocks.12/self_attn/Neg_1_output_0", "/blocks.12/self_attn/Unsqueeze_8_output_0", "/blocks.12/self_attn/Slice_2_output_0", "/blocks.12/self_attn/Concat_4_output_0", "/blocks.12/self_attn/Mul_3_output_0", "/blocks.12/self_attn/Add_1_output_0", "/blocks.12/self_attn/v_proj/FakeLinear_output_0", "/blocks.12/self_attn/Unsqueeze_4_output_0", "/blocks.12/self_attn/Unsqueeze_5_output_0", "/blocks.12/self_attn/Concat_2_output_0", "/blocks.12/self_attn/Reshape_2_output_0", "/blocks.12/self_attn/Reshape_7_output_0", "/blocks.12/self_attn/o_proj/FakeLinear_output_0", "/blocks.12/Add_output_0", "/blocks.12/post_attention_layernorm/Mul_1_output_0", "/blocks.12/mlp/gate_proj/FakeLinear_output_0", "/blocks.12/mlp/act_fn/Mul_output_0", "/blocks.12/mlp/up_proj/FakeLinear_output_0", "/blocks.12/mlp/Mul_output_0", "/blocks.12/mlp/down_proj/FakeLinear_output_0", "/blocks.12/Add_1_output_0", "/blocks.13/Reshape_output_0", "/blocks.13/input_layernorm/Mul_1_output_0", "/blocks.13/self_attn/q_proj/FakeLinear_output_0", "/blocks.13/self_attn/Shape_output_0", "Shape4933", "Rank4935", "BinaryOp4937", "Unsqueeze4938", "BinaryOp4940", "Unsqueeze4941", "StridedSlice4944", "Squeeze4945", "BinaryOp4947", "/blocks.13/self_attn/Gather_output_0", "/blocks.13/self_attn/Unsqueeze_output_0", "Unsqueeze4955", "Unsqueeze4958", "StridedSlice4961", "Squeeze4962", "BinaryOp4963", "BinaryOp4964", "/blocks.13/self_attn/Gather_1_output_0", "/blocks.13/self_attn/Unsqueeze_1_output_0", "/blocks.13/self_attn/Concat_output_0", "/blocks.13/self_attn/Reshape_output_0", "/blocks.13/self_attn/Mul_output_0", "/blocks.13/self_attn/Shape_2_output_0", "Shape5065", "Rank5067", "BinaryOp5069", "Unsqueeze5070", "BinaryOp5072", "Unsqueeze5073", "StridedSlice5076", "Squeeze5077", "BinaryOp5078", "BinaryOp5079", "/blocks.13/self_attn/Gather_2_output_0", "/blocks.13/self_attn/Div_output_0", "/blocks.13/self_attn/Unsqueeze_7_output_0", "/blocks.13/self_attn/Slice_1_output_0", "/blocks.13/self_attn/Neg_output_0", "/blocks.13/self_attn/Unsqueeze_6_output_0", "/blocks.13/self_attn/Slice_output_0", "/blocks.13/self_attn/Concat_3_output_0", "/blocks.13/self_attn/Mul_1_output_0", "/blocks.13/self_attn/Add_output_0", "/blocks.13/self_attn/k_proj/FakeLinear_output_0", "/blocks.13/self_attn/Unsqueeze_2_output_0", "/blocks.13/self_attn/Unsqueeze_3_output_0", "/blocks.13/self_attn/Concat_1_output_0", "/blocks.13/self_attn/Reshape_1_output_0", "/blocks.13/self_attn/Mul_2_output_0", "/blocks.13/self_attn/Shape_3_output_0", "Shape4971", "Rank4973", "BinaryOp4975", "Unsqueeze4976", "BinaryOp4978", "Unsqueeze4979", "StridedSlice4982", "Squeeze4983", "BinaryOp4984", "BinaryOp4985", "/blocks.13/self_attn/Gather_3_output_0", "/blocks.13/self_attn/Div_1_output_0", "/blocks.13/self_attn/Unsqueeze_9_output_0", "/blocks.13/self_attn/Slice_3_output_0", "/blocks.13/self_attn/Neg_1_output_0", "/blocks.13/self_attn/Unsqueeze_8_output_0", "/blocks.13/self_attn/Slice_2_output_0", "/blocks.13/self_attn/Concat_4_output_0", "/blocks.13/self_attn/Mul_3_output_0", "/blocks.13/self_attn/Add_1_output_0", "/blocks.13/self_attn/v_proj/FakeLinear_output_0", "/blocks.13/self_attn/Unsqueeze_4_output_0", "/blocks.13/self_attn/Unsqueeze_5_output_0", "/blocks.13/self_attn/Concat_2_output_0", "/blocks.13/self_attn/Reshape_2_output_0", "/blocks.13/self_attn/Reshape_7_output_0", "/blocks.13/self_attn/o_proj/FakeLinear_output_0", "/blocks.13/Add_output_0", "/blocks.13/post_attention_layernorm/Mul_1_output_0", "/blocks.13/mlp/gate_proj/FakeLinear_output_0", "/blocks.13/mlp/act_fn/Mul_output_0", "/blocks.13/mlp/up_proj/FakeLinear_output_0", "/blocks.13/mlp/Mul_output_0", "/blocks.13/mlp/down_proj/FakeLinear_output_0", "/blocks.13/Add_1_output_0", "/blocks.14/Reshape_output_0", "/blocks.14/input_layernorm/Mul_1_output_0", "/blocks.14/self_attn/q_proj/FakeLinear_output_0", "/blocks.14/self_attn/Shape_output_0", "Shape5304", "Rank5306", "BinaryOp5308", "Unsqueeze5309", "BinaryOp5311", "Unsqueeze5312", "StridedSlice5315", "Squeeze5316", "BinaryOp5318", "/blocks.14/self_attn/Gather_output_0", "/blocks.14/self_attn/Unsqueeze_output_0", "Unsqueeze5326", "Unsqueeze5329", "StridedSlice5332", "Squeeze5333", "BinaryOp5334", "BinaryOp5335", "/blocks.14/self_attn/Gather_1_output_0", "/blocks.14/self_attn/Unsqueeze_1_output_0", "/blocks.14/self_attn/Concat_output_0", "/blocks.14/self_attn/Reshape_output_0", "/blocks.14/self_attn/Mul_output_0", "/blocks.14/self_attn/Shape_2_output_0", "Shape5436", "Rank5438", "BinaryOp5440", "Unsqueeze5441", "BinaryOp5443", "Unsqueeze5444", "StridedSlice5447", "Squeeze5448", "BinaryOp5449", "BinaryOp5450", "/blocks.14/self_attn/Gather_2_output_0", "/blocks.14/self_attn/Div_output_0", "/blocks.14/self_attn/Unsqueeze_7_output_0", "/blocks.14/self_attn/Slice_1_output_0", "/blocks.14/self_attn/Neg_output_0", "/blocks.14/self_attn/Unsqueeze_6_output_0", "/blocks.14/self_attn/Slice_output_0", "/blocks.14/self_attn/Concat_3_output_0", "/blocks.14/self_attn/Mul_1_output_0", "/blocks.14/self_attn/Add_output_0", "/blocks.14/self_attn/k_proj/FakeLinear_output_0", "/blocks.14/self_attn/Unsqueeze_2_output_0", "/blocks.14/self_attn/Unsqueeze_3_output_0", "/blocks.14/self_attn/Concat_1_output_0", "/blocks.14/self_attn/Reshape_1_output_0", "/blocks.14/self_attn/Mul_2_output_0", "/blocks.14/self_attn/Shape_3_output_0", "Shape5342", "Rank5344", "BinaryOp5346", "Unsqueeze5347", "BinaryOp5349", "Unsqueeze5350", "StridedSlice5353", "Squeeze5354", "BinaryOp5355", "BinaryOp5356", "/blocks.14/self_attn/Gather_3_output_0", "/blocks.14/self_attn/Div_1_output_0", "/blocks.14/self_attn/Unsqueeze_9_output_0", "/blocks.14/self_attn/Slice_3_output_0", "/blocks.14/self_attn/Neg_1_output_0", "/blocks.14/self_attn/Unsqueeze_8_output_0", "/blocks.14/self_attn/Slice_2_output_0", "/blocks.14/self_attn/Concat_4_output_0", "/blocks.14/self_attn/Mul_3_output_0", "/blocks.14/self_attn/Add_1_output_0", "/blocks.14/self_attn/v_proj/FakeLinear_output_0", "/blocks.14/self_attn/Unsqueeze_4_output_0", "/blocks.14/self_attn/Unsqueeze_5_output_0", "/blocks.14/self_attn/Concat_2_output_0", "/blocks.14/self_attn/Reshape_2_output_0", "/blocks.14/self_attn/Reshape_7_output_0", "/blocks.14/self_attn/o_proj/FakeLinear_output_0", "/blocks.14/Add_output_0", "/blocks.14/post_attention_layernorm/Mul_1_output_0", "/blocks.14/mlp/gate_proj/FakeLinear_output_0", "/blocks.14/mlp/act_fn/Mul_output_0", "/blocks.14/mlp/up_proj/FakeLinear_output_0", "/blocks.14/mlp/Mul_output_0", "/blocks.14/mlp/down_proj/FakeLinear_output_0", "/blocks.14/Add_1_output_0", "/blocks.15/Reshape_output_0", "/blocks.15/input_layernorm/Mul_1_output_0", "/blocks.15/self_attn/q_proj/FakeLinear_output_0", "/blocks.15/self_attn/Shape_output_0", "Shape5675", "Rank5677", "BinaryOp5679", "Unsqueeze5680", "BinaryOp5682", "Unsqueeze5683", "StridedSlice5686", "Squeeze5687", "BinaryOp5689", "/blocks.15/self_attn/Gather_output_0", "/blocks.15/self_attn/Unsqueeze_output_0", "Unsqueeze5697", "Unsqueeze5700", "StridedSlice5703", "Squeeze5704", "BinaryOp5705", "BinaryOp5706", "/blocks.15/self_attn/Gather_1_output_0", "/blocks.15/self_attn/Unsqueeze_1_output_0", "/blocks.15/self_attn/Concat_output_0", "/blocks.15/self_attn/Reshape_output_0", "/blocks.15/self_attn/Mul_output_0", "/blocks.15/self_attn/Shape_2_output_0", "Shape5807", "Rank5809", "BinaryOp5811", "Unsqueeze5812", "BinaryOp5814", "Unsqueeze5815", "StridedSlice5818", "Squeeze5819", "BinaryOp5820", "BinaryOp5821", "/blocks.15/self_attn/Gather_2_output_0", "/blocks.15/self_attn/Div_output_0", "/blocks.15/self_attn/Unsqueeze_7_output_0", "/blocks.15/self_attn/Slice_1_output_0", "/blocks.15/self_attn/Neg_output_0", "/blocks.15/self_attn/Unsqueeze_6_output_0", "/blocks.15/self_attn/Slice_output_0", "/blocks.15/self_attn/Concat_3_output_0", "/blocks.15/self_attn/Mul_1_output_0", "/blocks.15/self_attn/Add_output_0", "/blocks.15/self_attn/k_proj/FakeLinear_output_0", "/blocks.15/self_attn/Unsqueeze_2_output_0", "/blocks.15/self_attn/Unsqueeze_3_output_0", "/blocks.15/self_attn/Concat_1_output_0", "/blocks.15/self_attn/Reshape_1_output_0", "/blocks.15/self_attn/Mul_2_output_0", "/blocks.15/self_attn/Shape_3_output_0", "Shape5713", "Rank5715", "BinaryOp5717", "Unsqueeze5718", "BinaryOp5720", "Unsqueeze5721", "StridedSlice5724", "Squeeze5725", "BinaryOp5726", "BinaryOp5727", "/blocks.15/self_attn/Gather_3_output_0", "/blocks.15/self_attn/Div_1_output_0", "/blocks.15/self_attn/Unsqueeze_9_output_0", "/blocks.15/self_attn/Slice_3_output_0", "/blocks.15/self_attn/Neg_1_output_0", "/blocks.15/self_attn/Unsqueeze_8_output_0", "/blocks.15/self_attn/Slice_2_output_0", "/blocks.15/self_attn/Concat_4_output_0", "/blocks.15/self_attn/Mul_3_output_0", "/blocks.15/self_attn/Add_1_output_0", "/blocks.15/self_attn/v_proj/FakeLinear_output_0", "/blocks.15/self_attn/Unsqueeze_4_output_0", "/blocks.15/self_attn/Unsqueeze_5_output_0", "/blocks.15/self_attn/Concat_2_output_0", "/blocks.15/self_attn/Reshape_2_output_0", "/blocks.15/self_attn/Reshape_7_output_0", "/blocks.15/self_attn/o_proj/FakeLinear_output_0", "/blocks.15/Add_output_0", "/blocks.15/post_attention_layernorm/Mul_1_output_0", "/blocks.15/mlp/gate_proj/FakeLinear_output_0", "/blocks.15/mlp/act_fn/Mul_output_0", "/blocks.15/mlp/up_proj/FakeLinear_output_0", "/blocks.15/mlp/Mul_output_0", "/blocks.15/mlp/down_proj/FakeLinear_output_0", "/blocks.15/Add_1_output_0", "/blocks.16/Reshape_output_0", "/blocks.16/input_layernorm/Mul_1_output_0", "/blocks.16/self_attn/q_proj/FakeLinear_output_0", "/blocks.16/self_attn/Shape_output_0", "Shape6046", "Rank6048", "BinaryOp6050", "Unsqueeze6051", "BinaryOp6053", "Unsqueeze6054", "StridedSlice6057", "Squeeze6058", "BinaryOp6060", "/blocks.16/self_attn/Gather_output_0", "/blocks.16/self_attn/Unsqueeze_output_0", "Unsqueeze6068", "Unsqueeze6071", "StridedSlice6074", "Squeeze6075", "BinaryOp6076", "BinaryOp6077", "/blocks.16/self_attn/Gather_1_output_0", "/blocks.16/self_attn/Unsqueeze_1_output_0", "/blocks.16/self_attn/Concat_output_0", "/blocks.16/self_attn/Reshape_output_0", "/blocks.16/self_attn/Mul_output_0", "/blocks.16/self_attn/Shape_2_output_0", "Shape6178", "Rank6180", "BinaryOp6182", "Unsqueeze6183", "BinaryOp6185", "Unsqueeze6186", "StridedSlice6189", "Squeeze6190", "BinaryOp6191", "BinaryOp6192", "/blocks.16/self_attn/Gather_2_output_0", "/blocks.16/self_attn/Div_output_0", "/blocks.16/self_attn/Unsqueeze_7_output_0", "/blocks.16/self_attn/Slice_1_output_0", "/blocks.16/self_attn/Neg_output_0", "/blocks.16/self_attn/Unsqueeze_6_output_0", "/blocks.16/self_attn/Slice_output_0", "/blocks.16/self_attn/Concat_3_output_0", "/blocks.16/self_attn/Mul_1_output_0", "/blocks.16/self_attn/Add_output_0", "/blocks.16/self_attn/k_proj/FakeLinear_output_0", "/blocks.16/self_attn/Unsqueeze_2_output_0", "/blocks.16/self_attn/Unsqueeze_3_output_0", "/blocks.16/self_attn/Concat_1_output_0", "/blocks.16/self_attn/Reshape_1_output_0", "/blocks.16/self_attn/Mul_2_output_0", "/blocks.16/self_attn/Shape_3_output_0", "Shape6084", "Rank6086", "BinaryOp6088", "Unsqueeze6089", "BinaryOp6091", "Unsqueeze6092", "StridedSlice6095", "Squeeze6096", "BinaryOp6097", "BinaryOp6098", "/blocks.16/self_attn/Gather_3_output_0", "/blocks.16/self_attn/Div_1_output_0", "/blocks.16/self_attn/Unsqueeze_9_output_0", "/blocks.16/self_attn/Slice_3_output_0", "/blocks.16/self_attn/Neg_1_output_0", "/blocks.16/self_attn/Unsqueeze_8_output_0", "/blocks.16/self_attn/Slice_2_output_0", "/blocks.16/self_attn/Concat_4_output_0", "/blocks.16/self_attn/Mul_3_output_0", "/blocks.16/self_attn/Add_1_output_0", "/blocks.16/self_attn/v_proj/FakeLinear_output_0", "/blocks.16/self_attn/Unsqueeze_4_output_0", "/blocks.16/self_attn/Unsqueeze_5_output_0", "/blocks.16/self_attn/Concat_2_output_0", "/blocks.16/self_attn/Reshape_2_output_0", "/blocks.16/self_attn/Reshape_7_output_0", "/blocks.16/self_attn/o_proj/FakeLinear_output_0", "/blocks.16/Add_output_0", "/blocks.16/post_attention_layernorm/Mul_1_output_0", "/blocks.16/mlp/gate_proj/FakeLinear_output_0", "/blocks.16/mlp/act_fn/Mul_output_0", "/blocks.16/mlp/up_proj/FakeLinear_output_0", "/blocks.16/mlp/Mul_output_0", "/blocks.16/mlp/down_proj/FakeLinear_output_0", "/blocks.16/Add_1_output_0", "/blocks.17/Reshape_output_0", "/blocks.17/input_layernorm/Mul_1_output_0", "/blocks.17/self_attn/q_proj/FakeLinear_output_0", "/blocks.17/self_attn/Shape_output_0", "Shape6417", "Rank6419", "BinaryOp6421", "Unsqueeze6422", "BinaryOp6424", "Unsqueeze6425", "StridedSlice6428", "Squeeze6429", "BinaryOp6431", "/blocks.17/self_attn/Gather_output_0", "/blocks.17/self_attn/Unsqueeze_output_0", "Unsqueeze6439", "Unsqueeze6442", "StridedSlice6445", "Squeeze6446", "BinaryOp6447", "BinaryOp6448", "/blocks.17/self_attn/Gather_1_output_0", "/blocks.17/self_attn/Unsqueeze_1_output_0", "/blocks.17/self_attn/Concat_output_0", "/blocks.17/self_attn/Reshape_output_0", "/blocks.17/self_attn/Mul_output_0", "/blocks.17/self_attn/Shape_2_output_0", "Shape6549", "Rank6551", "BinaryOp6553", "Unsqueeze6554", "BinaryOp6556", "Unsqueeze6557", "StridedSlice6560", "Squeeze6561", "BinaryOp6562", "BinaryOp6563", "/blocks.17/self_attn/Gather_2_output_0", "/blocks.17/self_attn/Div_output_0", "/blocks.17/self_attn/Unsqueeze_7_output_0", "/blocks.17/self_attn/Slice_1_output_0", "/blocks.17/self_attn/Neg_output_0", "/blocks.17/self_attn/Unsqueeze_6_output_0", "/blocks.17/self_attn/Slice_output_0", "/blocks.17/self_attn/Concat_3_output_0", "/blocks.17/self_attn/Mul_1_output_0", "/blocks.17/self_attn/Add_output_0", "/blocks.17/self_attn/k_proj/FakeLinear_output_0", "/blocks.17/self_attn/Unsqueeze_2_output_0", "/blocks.17/self_attn/Unsqueeze_3_output_0", "/blocks.17/self_attn/Concat_1_output_0", "/blocks.17/self_attn/Reshape_1_output_0", "/blocks.17/self_attn/Mul_2_output_0", "/blocks.17/self_attn/Shape_3_output_0", "Shape6455", "Rank6457", "BinaryOp6459", "Unsqueeze6460", "BinaryOp6462", "Unsqueeze6463", "StridedSlice6466", "Squeeze6467", "BinaryOp6468", "BinaryOp6469", "/blocks.17/self_attn/Gather_3_output_0", "/blocks.17/self_attn/Div_1_output_0", "/blocks.17/self_attn/Unsqueeze_9_output_0", "/blocks.17/self_attn/Slice_3_output_0", "/blocks.17/self_attn/Neg_1_output_0", "/blocks.17/self_attn/Unsqueeze_8_output_0", "/blocks.17/self_attn/Slice_2_output_0", "/blocks.17/self_attn/Concat_4_output_0", "/blocks.17/self_attn/Mul_3_output_0", "/blocks.17/self_attn/Add_1_output_0", "/blocks.17/self_attn/v_proj/FakeLinear_output_0", "/blocks.17/self_attn/Unsqueeze_4_output_0", "/blocks.17/self_attn/Unsqueeze_5_output_0", "/blocks.17/self_attn/Concat_2_output_0", "/blocks.17/self_attn/Reshape_2_output_0", "/blocks.17/self_attn/Reshape_7_output_0", "/blocks.17/self_attn/o_proj/FakeLinear_output_0", "/blocks.17/Add_output_0", "/blocks.17/post_attention_layernorm/Mul_1_output_0", "/blocks.17/mlp/gate_proj/FakeLinear_output_0", "/blocks.17/mlp/act_fn/Mul_output_0", "/blocks.17/mlp/up_proj/FakeLinear_output_0", "/blocks.17/mlp/Mul_output_0", "/blocks.17/mlp/down_proj/FakeLinear_output_0", "/blocks.17/Add_1_output_0", "/blocks.18/Reshape_output_0", "/blocks.18/input_layernorm/Mul_1_output_0", "/blocks.18/self_attn/q_proj/FakeLinear_output_0", "/blocks.18/self_attn/Shape_output_0", "Shape6788", "Rank6790", "BinaryOp6792", "Unsqueeze6793", "BinaryOp6795", "Unsqueeze6796", "StridedSlice6799", "Squeeze6800", "BinaryOp6802", "/blocks.18/self_attn/Gather_output_0", "/blocks.18/self_attn/Unsqueeze_output_0", "Unsqueeze6810", "Unsqueeze6813", "StridedSlice6816", "Squeeze6817", "BinaryOp6818", "BinaryOp6819", "/blocks.18/self_attn/Gather_1_output_0", "/blocks.18/self_attn/Unsqueeze_1_output_0", "/blocks.18/self_attn/Concat_output_0", "/blocks.18/self_attn/Reshape_output_0", "/blocks.18/self_attn/Mul_output_0", "/blocks.18/self_attn/Shape_2_output_0", "Shape6920", "Rank6922", "BinaryOp6924", "Unsqueeze6925", "BinaryOp6927", "Unsqueeze6928", "StridedSlice6931", "Squeeze6932", "BinaryOp6933", "BinaryOp6934", "/blocks.18/self_attn/Gather_2_output_0", "/blocks.18/self_attn/Div_output_0", "/blocks.18/self_attn/Unsqueeze_7_output_0", "/blocks.18/self_attn/Slice_1_output_0", "/blocks.18/self_attn/Neg_output_0", "/blocks.18/self_attn/Unsqueeze_6_output_0", "/blocks.18/self_attn/Slice_output_0", "/blocks.18/self_attn/Concat_3_output_0", "/blocks.18/self_attn/Mul_1_output_0", "/blocks.18/self_attn/Add_output_0", "/blocks.18/self_attn/k_proj/FakeLinear_output_0", "/blocks.18/self_attn/Unsqueeze_2_output_0", "/blocks.18/self_attn/Unsqueeze_3_output_0", "/blocks.18/self_attn/Concat_1_output_0", "/blocks.18/self_attn/Reshape_1_output_0", "/blocks.18/self_attn/Mul_2_output_0", "/blocks.18/self_attn/Shape_3_output_0", "Shape6826", "Rank6828", "BinaryOp6830", "Unsqueeze6831", "BinaryOp6833", "Unsqueeze6834", "StridedSlice6837", "Squeeze6838", "BinaryOp6839", "BinaryOp6840", "/blocks.18/self_attn/Gather_3_output_0", "/blocks.18/self_attn/Div_1_output_0", "/blocks.18/self_attn/Unsqueeze_9_output_0", "/blocks.18/self_attn/Slice_3_output_0", "/blocks.18/self_attn/Neg_1_output_0", "/blocks.18/self_attn/Unsqueeze_8_output_0", "/blocks.18/self_attn/Slice_2_output_0", "/blocks.18/self_attn/Concat_4_output_0", "/blocks.18/self_attn/Mul_3_output_0", "/blocks.18/self_attn/Add_1_output_0", "/blocks.18/self_attn/v_proj/FakeLinear_output_0", "/blocks.18/self_attn/Unsqueeze_4_output_0", "/blocks.18/self_attn/Unsqueeze_5_output_0", "/blocks.18/self_attn/Concat_2_output_0", "/blocks.18/self_attn/Reshape_2_output_0", "/blocks.18/self_attn/Reshape_7_output_0", "/blocks.18/self_attn/o_proj/FakeLinear_output_0", "/blocks.18/Add_output_0", "/blocks.18/post_attention_layernorm/Mul_1_output_0", "/blocks.18/mlp/gate_proj/FakeLinear_output_0", "/blocks.18/mlp/act_fn/Mul_output_0", "/blocks.18/mlp/up_proj/FakeLinear_output_0", "/blocks.18/mlp/Mul_output_0", "/blocks.18/mlp/down_proj/FakeLinear_output_0", "/blocks.18/Add_1_output_0", "/blocks.19/Reshape_output_0", "/blocks.19/input_layernorm/Mul_1_output_0", "/blocks.19/self_attn/q_proj/FakeLinear_output_0", "/blocks.19/self_attn/Shape_output_0", "Shape7159", "Rank7161", "BinaryOp7163", "Unsqueeze7164", "BinaryOp7166", "Unsqueeze7167", "StridedSlice7170", "Squeeze7171", "BinaryOp7173", "/blocks.19/self_attn/Gather_output_0", "/blocks.19/self_attn/Unsqueeze_output_0", "Unsqueeze7181", "Unsqueeze7184", "StridedSlice7187", "Squeeze7188", "BinaryOp7189", "BinaryOp7190", "/blocks.19/self_attn/Gather_1_output_0", "/blocks.19/self_attn/Unsqueeze_1_output_0", "/blocks.19/self_attn/Concat_output_0", "/blocks.19/self_attn/Reshape_output_0", "/blocks.19/self_attn/Mul_output_0", "/blocks.19/self_attn/Shape_2_output_0", "Shape7291", "Rank7293", "BinaryOp7295", "Unsqueeze7296", "BinaryOp7298", "Unsqueeze7299", "StridedSlice7302", "Squeeze7303", "BinaryOp7304", "BinaryOp7305", "/blocks.19/self_attn/Gather_2_output_0", "/blocks.19/self_attn/Div_output_0", "/blocks.19/self_attn/Unsqueeze_7_output_0", "/blocks.19/self_attn/Slice_1_output_0", "/blocks.19/self_attn/Neg_output_0", "/blocks.19/self_attn/Unsqueeze_6_output_0", "/blocks.19/self_attn/Slice_output_0", "/blocks.19/self_attn/Concat_3_output_0", "/blocks.19/self_attn/Mul_1_output_0", "/blocks.19/self_attn/Add_output_0", "/blocks.19/self_attn/k_proj/FakeLinear_output_0", "/blocks.19/self_attn/Unsqueeze_2_output_0", "/blocks.19/self_attn/Unsqueeze_3_output_0", "/blocks.19/self_attn/Concat_1_output_0", "/blocks.19/self_attn/Reshape_1_output_0", "/blocks.19/self_attn/Mul_2_output_0", "/blocks.19/self_attn/Shape_3_output_0", "Shape7197", "Rank7199", "BinaryOp7201", "Unsqueeze7202", "BinaryOp7204", "Unsqueeze7205", "StridedSlice7208", "Squeeze7209", "BinaryOp7210", "BinaryOp7211", "/blocks.19/self_attn/Gather_3_output_0", "/blocks.19/self_attn/Div_1_output_0", "/blocks.19/self_attn/Unsqueeze_9_output_0", "/blocks.19/self_attn/Slice_3_output_0", "/blocks.19/self_attn/Neg_1_output_0", "/blocks.19/self_attn/Unsqueeze_8_output_0", "/blocks.19/self_attn/Slice_2_output_0", "/blocks.19/self_attn/Concat_4_output_0", "/blocks.19/self_attn/Mul_3_output_0", "/blocks.19/self_attn/Add_1_output_0", "/blocks.19/self_attn/v_proj/FakeLinear_output_0", "/blocks.19/self_attn/Unsqueeze_4_output_0", "/blocks.19/self_attn/Unsqueeze_5_output_0", "/blocks.19/self_attn/Concat_2_output_0", "/blocks.19/self_attn/Reshape_2_output_0", "/blocks.19/self_attn/Reshape_7_output_0", "/blocks.19/self_attn/o_proj/FakeLinear_output_0", "/blocks.19/Add_output_0", "/blocks.19/post_attention_layernorm/Mul_1_output_0", "/blocks.19/mlp/gate_proj/FakeLinear_output_0", "/blocks.19/mlp/act_fn/Mul_output_0", "/blocks.19/mlp/up_proj/FakeLinear_output_0", "/blocks.19/mlp/Mul_output_0", "/blocks.19/mlp/down_proj/FakeLinear_output_0", "/blocks.19/Add_1_output_0", "/blocks.20/Reshape_output_0", "/blocks.20/input_layernorm/Mul_1_output_0", "/blocks.20/self_attn/q_proj/FakeLinear_output_0", "/blocks.20/self_attn/Shape_output_0", "Shape7530", "Rank7532", "BinaryOp7534", "Unsqueeze7535", "BinaryOp7537", "Unsqueeze7538", "StridedSlice7541", "Squeeze7542", "BinaryOp7544", "/blocks.20/self_attn/Gather_output_0", "/blocks.20/self_attn/Unsqueeze_output_0", "Unsqueeze7552", "Unsqueeze7555", "StridedSlice7558", "Squeeze7559", "BinaryOp7560", "BinaryOp7561", "/blocks.20/self_attn/Gather_1_output_0", "/blocks.20/self_attn/Unsqueeze_1_output_0", "/blocks.20/self_attn/Concat_output_0", "/blocks.20/self_attn/Reshape_output_0", "/blocks.20/self_attn/Mul_output_0", "/blocks.20/self_attn/Shape_2_output_0", "Shape7662", "Rank7664", "BinaryOp7666", "Unsqueeze7667", "BinaryOp7669", "Unsqueeze7670", "StridedSlice7673", "Squeeze7674", "BinaryOp7675", "BinaryOp7676", "/blocks.20/self_attn/Gather_2_output_0", "/blocks.20/self_attn/Div_output_0", "/blocks.20/self_attn/Unsqueeze_7_output_0", "/blocks.20/self_attn/Slice_1_output_0", "/blocks.20/self_attn/Neg_output_0", "/blocks.20/self_attn/Unsqueeze_6_output_0", "/blocks.20/self_attn/Slice_output_0", "/blocks.20/self_attn/Concat_3_output_0", "/blocks.20/self_attn/Mul_1_output_0", "/blocks.20/self_attn/Add_output_0", "/blocks.20/self_attn/k_proj/FakeLinear_output_0", "/blocks.20/self_attn/Unsqueeze_2_output_0", "/blocks.20/self_attn/Unsqueeze_3_output_0", "/blocks.20/self_attn/Concat_1_output_0", "/blocks.20/self_attn/Reshape_1_output_0", "/blocks.20/self_attn/Mul_2_output_0", "/blocks.20/self_attn/Shape_3_output_0", "Shape7568", "Rank7570", "BinaryOp7572", "Unsqueeze7573", "BinaryOp7575", "Unsqueeze7576", "StridedSlice7579", "Squeeze7580", "BinaryOp7581", "BinaryOp7582", "/blocks.20/self_attn/Gather_3_output_0", "/blocks.20/self_attn/Div_1_output_0", "/blocks.20/self_attn/Unsqueeze_9_output_0", "/blocks.20/self_attn/Slice_3_output_0", "/blocks.20/self_attn/Neg_1_output_0", "/blocks.20/self_attn/Unsqueeze_8_output_0", "/blocks.20/self_attn/Slice_2_output_0", "/blocks.20/self_attn/Concat_4_output_0", "/blocks.20/self_attn/Mul_3_output_0", "/blocks.20/self_attn/Add_1_output_0", "/blocks.20/self_attn/v_proj/FakeLinear_output_0", "/blocks.20/self_attn/Unsqueeze_4_output_0", "/blocks.20/self_attn/Unsqueeze_5_output_0", "/blocks.20/self_attn/Concat_2_output_0", "/blocks.20/self_attn/Reshape_2_output_0", "/blocks.20/self_attn/Reshape_7_output_0", "/blocks.20/self_attn/o_proj/FakeLinear_output_0", "/blocks.20/Add_output_0", "/blocks.20/post_attention_layernorm/Mul_1_output_0", "/blocks.20/mlp/gate_proj/FakeLinear_output_0", "/blocks.20/mlp/act_fn/Mul_output_0", "/blocks.20/mlp/up_proj/FakeLinear_output_0", "/blocks.20/mlp/Mul_output_0", "/blocks.20/mlp/down_proj/FakeLinear_output_0", "/blocks.20/Add_1_output_0", "/blocks.21/Reshape_output_0", "/blocks.21/input_layernorm/Mul_1_output_0", "/blocks.21/self_attn/q_proj/FakeLinear_output_0", "/blocks.21/self_attn/Shape_output_0", "Shape7901", "Rank7903", "BinaryOp7905", "Unsqueeze7906", "BinaryOp7908", "Unsqueeze7909", "StridedSlice7912", "Squeeze7913", "BinaryOp7915", "/blocks.21/self_attn/Gather_output_0", "/blocks.21/self_attn/Unsqueeze_output_0", "Unsqueeze7923", "Unsqueeze7926", "StridedSlice7929", "Squeeze7930", "BinaryOp7931", "BinaryOp7932", "/blocks.21/self_attn/Gather_1_output_0", "/blocks.21/self_attn/Unsqueeze_1_output_0", "/blocks.21/self_attn/Concat_output_0", "/blocks.21/self_attn/Reshape_output_0", "/blocks.21/self_attn/Mul_output_0", "/blocks.21/self_attn/Shape_2_output_0", "Shape8033", "Rank8035", "BinaryOp8037", "Unsqueeze8038", "BinaryOp8040", "Unsqueeze8041", "StridedSlice8044", "Squeeze8045", "BinaryOp8046", "BinaryOp8047", "/blocks.21/self_attn/Gather_2_output_0", "/blocks.21/self_attn/Div_output_0", "/blocks.21/self_attn/Unsqueeze_7_output_0", "/blocks.21/self_attn/Slice_1_output_0", "/blocks.21/self_attn/Neg_output_0", "/blocks.21/self_attn/Unsqueeze_6_output_0", "/blocks.21/self_attn/Slice_output_0", "/blocks.21/self_attn/Concat_3_output_0", "/blocks.21/self_attn/Mul_1_output_0", "/blocks.21/self_attn/Add_output_0", "/blocks.21/self_attn/k_proj/FakeLinear_output_0", "/blocks.21/self_attn/Unsqueeze_2_output_0", "/blocks.21/self_attn/Unsqueeze_3_output_0", "/blocks.21/self_attn/Concat_1_output_0", "/blocks.21/self_attn/Reshape_1_output_0", "/blocks.21/self_attn/Mul_2_output_0", "/blocks.21/self_attn/Shape_3_output_0", "Shape7939", "Rank7941", "BinaryOp7943", "Unsqueeze7944", "BinaryOp7946", "Unsqueeze7947", "StridedSlice7950", "Squeeze7951", "BinaryOp7952", "BinaryOp7953", "/blocks.21/self_attn/Gather_3_output_0", "/blocks.21/self_attn/Div_1_output_0", "/blocks.21/self_attn/Unsqueeze_9_output_0", "/blocks.21/self_attn/Slice_3_output_0", "/blocks.21/self_attn/Neg_1_output_0", "/blocks.21/self_attn/Unsqueeze_8_output_0", "/blocks.21/self_attn/Slice_2_output_0", "/blocks.21/self_attn/Concat_4_output_0", "/blocks.21/self_attn/Mul_3_output_0", "/blocks.21/self_attn/Add_1_output_0", "/blocks.21/self_attn/v_proj/FakeLinear_output_0", "/blocks.21/self_attn/Unsqueeze_4_output_0", "/blocks.21/self_attn/Unsqueeze_5_output_0", "/blocks.21/self_attn/Concat_2_output_0", "/blocks.21/self_attn/Reshape_2_output_0", "/blocks.21/self_attn/Reshape_7_output_0", "/blocks.21/self_attn/o_proj/FakeLinear_output_0", "/blocks.21/Add_output_0", "/blocks.21/post_attention_layernorm/Mul_1_output_0", "/blocks.21/mlp/gate_proj/FakeLinear_output_0", "/blocks.21/mlp/act_fn/Mul_output_0", "/blocks.21/mlp/up_proj/FakeLinear_output_0", "/blocks.21/mlp/Mul_output_0", "/blocks.21/mlp/down_proj/FakeLinear_output_0", "/blocks.21/Add_1_output_0", "/blocks.22/Reshape_output_0", "/blocks.22/input_layernorm/Mul_1_output_0", "/blocks.22/self_attn/q_proj/FakeLinear_output_0", "/blocks.22/self_attn/Shape_output_0", "Shape8272", "Rank8274", "BinaryOp8276", "Unsqueeze8277", "BinaryOp8279", "Unsqueeze8280", "StridedSlice8283", "Squeeze8284", "BinaryOp8286", "/blocks.22/self_attn/Gather_output_0", "/blocks.22/self_attn/Unsqueeze_output_0", "Unsqueeze8294", "Unsqueeze8297", "StridedSlice8300", "Squeeze8301", "BinaryOp8302", "BinaryOp8303", "/blocks.22/self_attn/Gather_1_output_0", "/blocks.22/self_attn/Unsqueeze_1_output_0", "/blocks.22/self_attn/Concat_output_0", "/blocks.22/self_attn/Reshape_output_0", "/blocks.22/self_attn/Mul_output_0", "/blocks.22/self_attn/Shape_2_output_0", "Shape8404", "Rank8406", "BinaryOp8408", "Unsqueeze8409", "BinaryOp8411", "Unsqueeze8412", "StridedSlice8415", "Squeeze8416", "BinaryOp8417", "BinaryOp8418", "/blocks.22/self_attn/Gather_2_output_0", "/blocks.22/self_attn/Div_output_0", "/blocks.22/self_attn/Unsqueeze_7_output_0", "/blocks.22/self_attn/Slice_1_output_0", "/blocks.22/self_attn/Neg_output_0", "/blocks.22/self_attn/Unsqueeze_6_output_0", "/blocks.22/self_attn/Slice_output_0", "/blocks.22/self_attn/Concat_3_output_0", "/blocks.22/self_attn/Mul_1_output_0", "/blocks.22/self_attn/Add_output_0", "/blocks.22/self_attn/k_proj/FakeLinear_output_0", "/blocks.22/self_attn/Unsqueeze_2_output_0", "/blocks.22/self_attn/Unsqueeze_3_output_0", "/blocks.22/self_attn/Concat_1_output_0", "/blocks.22/self_attn/Reshape_1_output_0", "/blocks.22/self_attn/Mul_2_output_0", "/blocks.22/self_attn/Shape_3_output_0", "Shape8310", "Rank8312", "BinaryOp8314", "Unsqueeze8315", "BinaryOp8317", "Unsqueeze8318", "StridedSlice8321", "Squeeze8322", "BinaryOp8323", "BinaryOp8324", "/blocks.22/self_attn/Gather_3_output_0", "/blocks.22/self_attn/Div_1_output_0", "/blocks.22/self_attn/Unsqueeze_9_output_0", "/blocks.22/self_attn/Slice_3_output_0", "/blocks.22/self_attn/Neg_1_output_0", "/blocks.22/self_attn/Unsqueeze_8_output_0", "/blocks.22/self_attn/Slice_2_output_0", "/blocks.22/self_attn/Concat_4_output_0", "/blocks.22/self_attn/Mul_3_output_0", "/blocks.22/self_attn/Add_1_output_0", "/blocks.22/self_attn/v_proj/FakeLinear_output_0", "/blocks.22/self_attn/Unsqueeze_4_output_0", "/blocks.22/self_attn/Unsqueeze_5_output_0", "/blocks.22/self_attn/Concat_2_output_0", "/blocks.22/self_attn/Reshape_2_output_0", "/blocks.22/self_attn/Reshape_7_output_0", "/blocks.22/self_attn/o_proj/FakeLinear_output_0", "/blocks.22/Add_output_0", "/blocks.22/post_attention_layernorm/Mul_1_output_0", "/blocks.22/mlp/gate_proj/FakeLinear_output_0", "/blocks.22/mlp/act_fn/Mul_output_0", "/blocks.22/mlp/up_proj/FakeLinear_output_0", "/blocks.22/mlp/Mul_output_0", "/blocks.22/mlp/down_proj/FakeLinear_output_0", "/blocks.22/Add_1_output_0", "/blocks.23/Reshape_output_0", "/blocks.23/input_layernorm/Mul_1_output_0", "/blocks.23/self_attn/q_proj/FakeLinear_output_0", "/blocks.23/self_attn/Shape_output_0", "Shape8643", "Rank8645", "BinaryOp8647", "Unsqueeze8648", "BinaryOp8650", "Unsqueeze8651", "StridedSlice8654", "Squeeze8655", "BinaryOp8657", "/blocks.23/self_attn/Gather_output_0", "/blocks.23/self_attn/Unsqueeze_output_0", "Unsqueeze8665", "Unsqueeze8668", "StridedSlice8671", "Squeeze8672", "BinaryOp8673", "BinaryOp8674", "/blocks.23/self_attn/Gather_1_output_0", "/blocks.23/self_attn/Unsqueeze_1_output_0", "/blocks.23/self_attn/Concat_output_0", "/blocks.23/self_attn/Reshape_output_0", "/blocks.23/self_attn/Mul_output_0", "/blocks.23/self_attn/Shape_2_output_0", "Shape8775", "Rank8777", "BinaryOp8779", "Unsqueeze8780", "BinaryOp8782", "Unsqueeze8783", "StridedSlice8786", "Squeeze8787", "BinaryOp8788", "BinaryOp8789", "/blocks.23/self_attn/Gather_2_output_0", "/blocks.23/self_attn/Div_output_0", "/blocks.23/self_attn/Unsqueeze_7_output_0", "/blocks.23/self_attn/Slice_1_output_0", "/blocks.23/self_attn/Neg_output_0", "/blocks.23/self_attn/Unsqueeze_6_output_0", "/blocks.23/self_attn/Slice_output_0", "/blocks.23/self_attn/Concat_3_output_0", "/blocks.23/self_attn/Mul_1_output_0", "/blocks.23/self_attn/Add_output_0", "/blocks.23/self_attn/k_proj/FakeLinear_output_0", "/blocks.23/self_attn/Unsqueeze_2_output_0", "/blocks.23/self_attn/Unsqueeze_3_output_0", "/blocks.23/self_attn/Concat_1_output_0", "/blocks.23/self_attn/Reshape_1_output_0", "/blocks.23/self_attn/Mul_2_output_0", "/blocks.23/self_attn/Shape_3_output_0", "Shape8681", "Rank8683", "BinaryOp8685", "Unsqueeze8686", "BinaryOp8688", "Unsqueeze8689", "StridedSlice8692", "Squeeze8693", "BinaryOp8694", "BinaryOp8695", "/blocks.23/self_attn/Gather_3_output_0", "/blocks.23/self_attn/Div_1_output_0", "/blocks.23/self_attn/Unsqueeze_9_output_0", "/blocks.23/self_attn/Slice_3_output_0", "/blocks.23/self_attn/Neg_1_output_0", "/blocks.23/self_attn/Unsqueeze_8_output_0", "/blocks.23/self_attn/Slice_2_output_0", "/blocks.23/self_attn/Concat_4_output_0", "/blocks.23/self_attn/Mul_3_output_0", "/blocks.23/self_attn/Add_1_output_0", "/blocks.23/self_attn/v_proj/FakeLinear_output_0", "/blocks.23/self_attn/Unsqueeze_4_output_0", "/blocks.23/self_attn/Unsqueeze_5_output_0", "/blocks.23/self_attn/Concat_2_output_0", "/blocks.23/self_attn/Reshape_2_output_0", "/blocks.23/self_attn/Reshape_7_output_0", "/blocks.23/self_attn/o_proj/FakeLinear_output_0", "/blocks.23/Add_output_0", "/blocks.23/post_attention_layernorm/Mul_1_output_0", "/blocks.23/mlp/gate_proj/FakeLinear_output_0", "/blocks.23/mlp/act_fn/Mul_output_0", "/blocks.23/mlp/up_proj/FakeLinear_output_0", "/blocks.23/mlp/Mul_output_0", "/blocks.23/mlp/down_proj/FakeLinear_output_0", "/blocks.23/Add_1_output_0", "/blocks.24/Reshape_output_0", "/blocks.24/input_layernorm/Mul_1_output_0", "/blocks.24/self_attn/q_proj/FakeLinear_output_0", "/blocks.24/self_attn/Shape_output_0", "Shape9014", "Rank9016", "BinaryOp9018", "Unsqueeze9019", "BinaryOp9021", "Unsqueeze9022", "StridedSlice9025", "Squeeze9026", "BinaryOp9028", "/blocks.24/self_attn/Gather_output_0", "/blocks.24/self_attn/Unsqueeze_output_0", "Unsqueeze9036", "Unsqueeze9039", "StridedSlice9042", "Squeeze9043", "BinaryOp9044", "BinaryOp9045", "/blocks.24/self_attn/Gather_1_output_0", "/blocks.24/self_attn/Unsqueeze_1_output_0", "/blocks.24/self_attn/Concat_output_0", "/blocks.24/self_attn/Reshape_output_0", "/blocks.24/self_attn/Mul_output_0", "/blocks.24/self_attn/Shape_2_output_0", "Shape9146", "Rank9148", "BinaryOp9150", "Unsqueeze9151", "BinaryOp9153", "Unsqueeze9154", "StridedSlice9157", "Squeeze9158", "BinaryOp9159", "BinaryOp9160", "/blocks.24/self_attn/Gather_2_output_0", "/blocks.24/self_attn/Div_output_0", "/blocks.24/self_attn/Unsqueeze_7_output_0", "/blocks.24/self_attn/Slice_1_output_0", "/blocks.24/self_attn/Neg_output_0", "/blocks.24/self_attn/Unsqueeze_6_output_0", "/blocks.24/self_attn/Slice_output_0", "/blocks.24/self_attn/Concat_3_output_0", "/blocks.24/self_attn/Mul_1_output_0", "/blocks.24/self_attn/Add_output_0", "/blocks.24/self_attn/k_proj/FakeLinear_output_0", "/blocks.24/self_attn/Unsqueeze_2_output_0", "/blocks.24/self_attn/Unsqueeze_3_output_0", "/blocks.24/self_attn/Concat_1_output_0", "/blocks.24/self_attn/Reshape_1_output_0", "/blocks.24/self_attn/Mul_2_output_0", "/blocks.24/self_attn/Shape_3_output_0", "Shape9052", "Rank9054", "BinaryOp9056", "Unsqueeze9057", "BinaryOp9059", "Unsqueeze9060", "StridedSlice9063", "Squeeze9064", "BinaryOp9065", "BinaryOp9066", "/blocks.24/self_attn/Gather_3_output_0", "/blocks.24/self_attn/Div_1_output_0", "/blocks.24/self_attn/Unsqueeze_9_output_0", "/blocks.24/self_attn/Slice_3_output_0", "/blocks.24/self_attn/Neg_1_output_0", "/blocks.24/self_attn/Unsqueeze_8_output_0", "/blocks.24/self_attn/Slice_2_output_0", "/blocks.24/self_attn/Concat_4_output_0", "/blocks.24/self_attn/Mul_3_output_0", "/blocks.24/self_attn/Add_1_output_0", "/blocks.24/self_attn/v_proj/FakeLinear_output_0", "/blocks.24/self_attn/Unsqueeze_4_output_0", "/blocks.24/self_attn/Unsqueeze_5_output_0", "/blocks.24/self_attn/Concat_2_output_0", "/blocks.24/self_attn/Reshape_2_output_0", "/blocks.24/self_attn/Reshape_7_output_0", "/blocks.24/self_attn/o_proj/FakeLinear_output_0", "/blocks.24/Add_output_0", "/blocks.24/post_attention_layernorm/Mul_1_output_0", "/blocks.24/mlp/gate_proj/FakeLinear_output_0", "/blocks.24/mlp/act_fn/Mul_output_0", "/blocks.24/mlp/up_proj/FakeLinear_output_0", "/blocks.24/mlp/Mul_output_0", "/blocks.24/mlp/down_proj/FakeLinear_output_0", "/blocks.24/Add_1_output_0", "/blocks.25/Reshape_output_0", "/blocks.25/input_layernorm/Mul_1_output_0", "/blocks.25/self_attn/q_proj/FakeLinear_output_0", "/blocks.25/self_attn/Shape_output_0", "Shape9385", "Rank9387", "BinaryOp9389", "Unsqueeze9390", "BinaryOp9392", "Unsqueeze9393", "StridedSlice9396", "Squeeze9397", "BinaryOp9399", "/blocks.25/self_attn/Gather_output_0", "/blocks.25/self_attn/Unsqueeze_output_0", "Unsqueeze9407", "Unsqueeze9410", "StridedSlice9413", "Squeeze9414", "BinaryOp9415", "BinaryOp9416", "/blocks.25/self_attn/Gather_1_output_0", "/blocks.25/self_attn/Unsqueeze_1_output_0", "/blocks.25/self_attn/Concat_output_0", "/blocks.25/self_attn/Reshape_output_0", "/blocks.25/self_attn/Mul_output_0", "/blocks.25/self_attn/Shape_2_output_0", "Shape9517", "Rank9519", "BinaryOp9521", "Unsqueeze9522", "BinaryOp9524", "Unsqueeze9525", "StridedSlice9528", "Squeeze9529", "BinaryOp9530", "BinaryOp9531", "/blocks.25/self_attn/Gather_2_output_0", "/blocks.25/self_attn/Div_output_0", "/blocks.25/self_attn/Unsqueeze_7_output_0", "/blocks.25/self_attn/Slice_1_output_0", "/blocks.25/self_attn/Neg_output_0", "/blocks.25/self_attn/Unsqueeze_6_output_0", "/blocks.25/self_attn/Slice_output_0", "/blocks.25/self_attn/Concat_3_output_0", "/blocks.25/self_attn/Mul_1_output_0", "/blocks.25/self_attn/Add_output_0", "/blocks.25/self_attn/k_proj/FakeLinear_output_0", "/blocks.25/self_attn/Unsqueeze_2_output_0", "/blocks.25/self_attn/Unsqueeze_3_output_0", "/blocks.25/self_attn/Concat_1_output_0", "/blocks.25/self_attn/Reshape_1_output_0", "/blocks.25/self_attn/Mul_2_output_0", "/blocks.25/self_attn/Shape_3_output_0", "Shape9423", "Rank9425", "BinaryOp9427", "Unsqueeze9428", "BinaryOp9430", "Unsqueeze9431", "StridedSlice9434", "Squeeze9435", "BinaryOp9436", "BinaryOp9437", "/blocks.25/self_attn/Gather_3_output_0", "/blocks.25/self_attn/Div_1_output_0", "/blocks.25/self_attn/Unsqueeze_9_output_0", "/blocks.25/self_attn/Slice_3_output_0", "/blocks.25/self_attn/Neg_1_output_0", "/blocks.25/self_attn/Unsqueeze_8_output_0", "/blocks.25/self_attn/Slice_2_output_0", "/blocks.25/self_attn/Concat_4_output_0", "/blocks.25/self_attn/Mul_3_output_0", "/blocks.25/self_attn/Add_1_output_0", "/blocks.25/self_attn/v_proj/FakeLinear_output_0", "/blocks.25/self_attn/Unsqueeze_4_output_0", "/blocks.25/self_attn/Unsqueeze_5_output_0", "/blocks.25/self_attn/Concat_2_output_0", "/blocks.25/self_attn/Reshape_2_output_0", "/blocks.25/self_attn/Reshape_7_output_0", "/blocks.25/self_attn/o_proj/FakeLinear_output_0", "/blocks.25/Add_output_0", "/blocks.25/post_attention_layernorm/Mul_1_output_0", "/blocks.25/mlp/gate_proj/FakeLinear_output_0", "/blocks.25/mlp/act_fn/Mul_output_0", "/blocks.25/mlp/up_proj/FakeLinear_output_0", "/blocks.25/mlp/Mul_output_0", "/blocks.25/mlp/down_proj/FakeLinear_output_0", "/blocks.25/Add_1_output_0", "/blocks.26/Reshape_output_0", "/blocks.26/input_layernorm/Mul_1_output_0", "/blocks.26/self_attn/q_proj/FakeLinear_output_0", "/blocks.26/self_attn/Shape_output_0", "Shape9756", "Rank9758", "BinaryOp9760", "Unsqueeze9761", "BinaryOp9763", "Unsqueeze9764", "StridedSlice9767", "Squeeze9768", "BinaryOp9770", "/blocks.26/self_attn/Gather_output_0", "/blocks.26/self_attn/Unsqueeze_output_0", "Unsqueeze9778", "Unsqueeze9781", "StridedSlice9784", "Squeeze9785", "BinaryOp9786", "BinaryOp9787", "/blocks.26/self_attn/Gather_1_output_0", "/blocks.26/self_attn/Unsqueeze_1_output_0", "/blocks.26/self_attn/Concat_output_0", "/blocks.26/self_attn/Reshape_output_0", "/blocks.26/self_attn/Mul_output_0", "/blocks.26/self_attn/Shape_2_output_0", "Shape9888", "Rank9890", "BinaryOp9892", "Unsqueeze9893", "BinaryOp9895", "Unsqueeze9896", "StridedSlice9899", "Squeeze9900", "BinaryOp9901", "BinaryOp9902", "/blocks.26/self_attn/Gather_2_output_0", "/blocks.26/self_attn/Div_output_0", "/blocks.26/self_attn/Unsqueeze_7_output_0", "/blocks.26/self_attn/Slice_1_output_0", "/blocks.26/self_attn/Neg_output_0", "/blocks.26/self_attn/Unsqueeze_6_output_0", "/blocks.26/self_attn/Slice_output_0", "/blocks.26/self_attn/Concat_3_output_0", "/blocks.26/self_attn/Mul_1_output_0", "/blocks.26/self_attn/Add_output_0", "/blocks.26/self_attn/k_proj/FakeLinear_output_0", "/blocks.26/self_attn/Unsqueeze_2_output_0", "/blocks.26/self_attn/Unsqueeze_3_output_0", "/blocks.26/self_attn/Concat_1_output_0", "/blocks.26/self_attn/Reshape_1_output_0", "/blocks.26/self_attn/Mul_2_output_0", "/blocks.26/self_attn/Shape_3_output_0", "Shape9794", "Rank9796", "BinaryOp9798", "Unsqueeze9799", "BinaryOp9801", "Unsqueeze9802", "StridedSlice9805", "Squeeze9806", "BinaryOp9807", "BinaryOp9808", "/blocks.26/self_attn/Gather_3_output_0", "/blocks.26/self_attn/Div_1_output_0", "/blocks.26/self_attn/Unsqueeze_9_output_0", "/blocks.26/self_attn/Slice_3_output_0", "/blocks.26/self_attn/Neg_1_output_0", "/blocks.26/self_attn/Unsqueeze_8_output_0", "/blocks.26/self_attn/Slice_2_output_0", "/blocks.26/self_attn/Concat_4_output_0", "/blocks.26/self_attn/Mul_3_output_0", "/blocks.26/self_attn/Add_1_output_0", "/blocks.26/self_attn/v_proj/FakeLinear_output_0", "/blocks.26/self_attn/Unsqueeze_4_output_0", "/blocks.26/self_attn/Unsqueeze_5_output_0", "/blocks.26/self_attn/Concat_2_output_0", "/blocks.26/self_attn/Reshape_2_output_0", "/blocks.26/self_attn/Reshape_7_output_0", "/blocks.26/self_attn/o_proj/FakeLinear_output_0", "/blocks.26/Add_output_0", "/blocks.26/post_attention_layernorm/Mul_1_output_0", "/blocks.26/mlp/gate_proj/FakeLinear_output_0", "/blocks.26/mlp/act_fn/Mul_output_0", "/blocks.26/mlp/up_proj/FakeLinear_output_0", "/blocks.26/mlp/Mul_output_0", "/blocks.26/mlp/down_proj/FakeLinear_output_0", "/blocks.26/Add_1_output_0", "/blocks.27/Reshape_output_0", "/blocks.27/input_layernorm/Mul_1_output_0", "/blocks.27/self_attn/q_proj/FakeLinear_output_0", "/blocks.27/self_attn/Shape_output_0", "Shape10127", "Rank10129", "BinaryOp10131", "Unsqueeze10132", "BinaryOp10134", "Unsqueeze10135", "StridedSlice10138", "Squeeze10139", "BinaryOp10141", "/blocks.27/self_attn/Gather_output_0", "/blocks.27/self_attn/Unsqueeze_output_0", "Unsqueeze10149", "Unsqueeze10152", "StridedSlice10155", "Squeeze10156", "BinaryOp10157", "BinaryOp10158", "/blocks.27/self_attn/Gather_1_output_0", "/blocks.27/self_attn/Unsqueeze_1_output_0", "/blocks.27/self_attn/Concat_output_0", "/blocks.27/self_attn/Reshape_output_0", "/blocks.27/self_attn/Mul_output_0", "/blocks.27/self_attn/Shape_2_output_0", "Shape10259", "Rank10261", "BinaryOp10263", "Unsqueeze10264", "BinaryOp10266", "Unsqueeze10267", "StridedSlice10270", "Squeeze10271", "BinaryOp10272", "BinaryOp10273", "/blocks.27/self_attn/Gather_2_output_0", "/blocks.27/self_attn/Div_output_0", "/blocks.27/self_attn/Unsqueeze_7_output_0", "/blocks.27/self_attn/Slice_1_output_0", "/blocks.27/self_attn/Neg_output_0", "/blocks.27/self_attn/Unsqueeze_6_output_0", "/blocks.27/self_attn/Slice_output_0", "/blocks.27/self_attn/Concat_3_output_0", "/blocks.27/self_attn/Mul_1_output_0", "/blocks.27/self_attn/Add_output_0", "/blocks.27/self_attn/k_proj/FakeLinear_output_0", "/blocks.27/self_attn/Unsqueeze_2_output_0", "/blocks.27/self_attn/Unsqueeze_3_output_0", "/blocks.27/self_attn/Concat_1_output_0", "/blocks.27/self_attn/Reshape_1_output_0", "/blocks.27/self_attn/Mul_2_output_0", "/blocks.27/self_attn/Shape_3_output_0", "Shape10165", "Rank10167", "BinaryOp10169", "Unsqueeze10170", "BinaryOp10172", "Unsqueeze10173", "StridedSlice10176", "Squeeze10177", "BinaryOp10178", "BinaryOp10179", "/blocks.27/self_attn/Gather_3_output_0", "/blocks.27/self_attn/Div_1_output_0", "/blocks.27/self_attn/Unsqueeze_9_output_0", "/blocks.27/self_attn/Slice_3_output_0", "/blocks.27/self_attn/Neg_1_output_0", "/blocks.27/self_attn/Unsqueeze_8_output_0", "/blocks.27/self_attn/Slice_2_output_0", "/blocks.27/self_attn/Concat_4_output_0", "/blocks.27/self_attn/Mul_3_output_0", "/blocks.27/self_attn/Add_1_output_0", "/blocks.27/self_attn/v_proj/FakeLinear_output_0", "/blocks.27/self_attn/Unsqueeze_4_output_0", "/blocks.27/self_attn/Unsqueeze_5_output_0", "/blocks.27/self_attn/Concat_2_output_0", "/blocks.27/self_attn/Reshape_2_output_0", "/blocks.27/self_attn/Reshape_7_output_0", "/blocks.27/self_attn/o_proj/FakeLinear_output_0", "/blocks.27/Add_output_0", "/blocks.27/post_attention_layernorm/Mul_1_output_0", "/blocks.27/mlp/gate_proj/FakeLinear_output_0", "/blocks.27/mlp/act_fn/Mul_output_0", "/blocks.27/mlp/up_proj/FakeLinear_output_0", "/blocks.27/mlp/Mul_output_0", "/blocks.27/mlp/down_proj/FakeLinear_output_0", "/blocks.27/Add_1_output_0", "/blocks.28/Reshape_output_0", "/blocks.28/input_layernorm/Mul_1_output_0", "/blocks.28/self_attn/q_proj/FakeLinear_output_0", "/blocks.28/self_attn/Shape_output_0", "Shape10498", "Rank10500", "BinaryOp10502", "Unsqueeze10503", "BinaryOp10505", "Unsqueeze10506", "StridedSlice10509", "Squeeze10510", "BinaryOp10512", "/blocks.28/self_attn/Gather_output_0", "/blocks.28/self_attn/Unsqueeze_output_0", "Unsqueeze10520", "Unsqueeze10523", "StridedSlice10526", "Squeeze10527", "BinaryOp10528", "BinaryOp10529", "/blocks.28/self_attn/Gather_1_output_0", "/blocks.28/self_attn/Unsqueeze_1_output_0", "/blocks.28/self_attn/Concat_output_0", "/blocks.28/self_attn/Reshape_output_0", "/blocks.28/self_attn/Mul_output_0", "/blocks.28/self_attn/Shape_2_output_0", "Shape10630", "Rank10632", "BinaryOp10634", "Unsqueeze10635", "BinaryOp10637", "Unsqueeze10638", "StridedSlice10641", "Squeeze10642", "BinaryOp10643", "BinaryOp10644", "/blocks.28/self_attn/Gather_2_output_0", "/blocks.28/self_attn/Div_output_0", "/blocks.28/self_attn/Unsqueeze_7_output_0", "/blocks.28/self_attn/Slice_1_output_0", "/blocks.28/self_attn/Neg_output_0", "/blocks.28/self_attn/Unsqueeze_6_output_0", "/blocks.28/self_attn/Slice_output_0", "/blocks.28/self_attn/Concat_3_output_0", "/blocks.28/self_attn/Mul_1_output_0", "/blocks.28/self_attn/Add_output_0", "/blocks.28/self_attn/k_proj/FakeLinear_output_0", "/blocks.28/self_attn/Unsqueeze_2_output_0", "/blocks.28/self_attn/Unsqueeze_3_output_0", "/blocks.28/self_attn/Concat_1_output_0", "/blocks.28/self_attn/Reshape_1_output_0", "/blocks.28/self_attn/Mul_2_output_0", "/blocks.28/self_attn/Shape_3_output_0", "Shape10536", "Rank10538", "BinaryOp10540", "Unsqueeze10541", "BinaryOp10543", "Unsqueeze10544", "StridedSlice10547", "Squeeze10548", "BinaryOp10549", "BinaryOp10550", "/blocks.28/self_attn/Gather_3_output_0", "/blocks.28/self_attn/Div_1_output_0", "/blocks.28/self_attn/Unsqueeze_9_output_0", "/blocks.28/self_attn/Slice_3_output_0", "/blocks.28/self_attn/Neg_1_output_0", "/blocks.28/self_attn/Unsqueeze_8_output_0", "/blocks.28/self_attn/Slice_2_output_0", "/blocks.28/self_attn/Concat_4_output_0", "/blocks.28/self_attn/Mul_3_output_0", "/blocks.28/self_attn/Add_1_output_0", "/blocks.28/self_attn/v_proj/FakeLinear_output_0", "/blocks.28/self_attn/Unsqueeze_4_output_0", "/blocks.28/self_attn/Unsqueeze_5_output_0", "/blocks.28/self_attn/Concat_2_output_0", "/blocks.28/self_attn/Reshape_2_output_0", "/blocks.28/self_attn/Reshape_7_output_0", "/blocks.28/self_attn/o_proj/FakeLinear_output_0", "/blocks.28/Add_output_0", "/blocks.28/post_attention_layernorm/Mul_1_output_0", "/blocks.28/mlp/gate_proj/FakeLinear_output_0", "/blocks.28/mlp/act_fn/Mul_output_0", "/blocks.28/mlp/up_proj/FakeLinear_output_0", "/blocks.28/mlp/Mul_output_0", "/blocks.28/mlp/down_proj/FakeLinear_output_0", "/blocks.28/Add_1_output_0", "/blocks.29/Reshape_output_0", "/blocks.29/input_layernorm/Mul_1_output_0", "/blocks.29/self_attn/q_proj/FakeLinear_output_0", "/blocks.29/self_attn/Shape_output_0", "Shape10869", "Rank10871", "BinaryOp10873", "Unsqueeze10874", "BinaryOp10876", "Unsqueeze10877", "StridedSlice10880", "Squeeze10881", "BinaryOp10883", "/blocks.29/self_attn/Gather_output_0", "/blocks.29/self_attn/Unsqueeze_output_0", "Unsqueeze10891", "Unsqueeze10894", "StridedSlice10897", "Squeeze10898", "BinaryOp10899", "BinaryOp10900", "/blocks.29/self_attn/Gather_1_output_0", "/blocks.29/self_attn/Unsqueeze_1_output_0", "/blocks.29/self_attn/Concat_output_0", "/blocks.29/self_attn/Reshape_output_0", "/blocks.29/self_attn/Mul_output_0", "/blocks.29/self_attn/Shape_2_output_0", "Shape11001", "Rank11003", "BinaryOp11005", "Unsqueeze11006", "BinaryOp11008", "Unsqueeze11009", "StridedSlice11012", "Squeeze11013", "BinaryOp11014", "BinaryOp11015", "/blocks.29/self_attn/Gather_2_output_0", "/blocks.29/self_attn/Div_output_0", "/blocks.29/self_attn/Unsqueeze_7_output_0", "/blocks.29/self_attn/Slice_1_output_0", "/blocks.29/self_attn/Neg_output_0", "/blocks.29/self_attn/Unsqueeze_6_output_0", "/blocks.29/self_attn/Slice_output_0", "/blocks.29/self_attn/Concat_3_output_0", "/blocks.29/self_attn/Mul_1_output_0", "/blocks.29/self_attn/Add_output_0", "/blocks.29/self_attn/k_proj/FakeLinear_output_0", "/blocks.29/self_attn/Unsqueeze_2_output_0", "/blocks.29/self_attn/Unsqueeze_3_output_0", "/blocks.29/self_attn/Concat_1_output_0", "/blocks.29/self_attn/Reshape_1_output_0", "/blocks.29/self_attn/Mul_2_output_0", "/blocks.29/self_attn/Shape_3_output_0", "Shape10907", "Rank10909", "BinaryOp10911", "Unsqueeze10912", "BinaryOp10914", "Unsqueeze10915", "StridedSlice10918", "Squeeze10919", "BinaryOp10920", "BinaryOp10921", "/blocks.29/self_attn/Gather_3_output_0", "/blocks.29/self_attn/Div_1_output_0", "/blocks.29/self_attn/Unsqueeze_9_output_0", "/blocks.29/self_attn/Slice_3_output_0", "/blocks.29/self_attn/Neg_1_output_0", "/blocks.29/self_attn/Unsqueeze_8_output_0", "/blocks.29/self_attn/Slice_2_output_0", "/blocks.29/self_attn/Concat_4_output_0", "/blocks.29/self_attn/Mul_3_output_0", "/blocks.29/self_attn/Add_1_output_0", "/blocks.29/self_attn/v_proj/FakeLinear_output_0", "/blocks.29/self_attn/Unsqueeze_4_output_0", "/blocks.29/self_attn/Unsqueeze_5_output_0", "/blocks.29/self_attn/Concat_2_output_0", "/blocks.29/self_attn/Reshape_2_output_0", "/blocks.29/self_attn/Reshape_7_output_0", "/blocks.29/self_attn/o_proj/FakeLinear_output_0", "/blocks.29/Add_output_0", "/blocks.29/post_attention_layernorm/Mul_1_output_0", "/blocks.29/mlp/gate_proj/FakeLinear_output_0", "/blocks.29/mlp/act_fn/Mul_output_0", "/blocks.29/mlp/up_proj/FakeLinear_output_0", "/blocks.29/mlp/Mul_output_0", "/blocks.29/mlp/down_proj/FakeLinear_output_0", "/blocks.29/Add_1_output_0", "/blocks.30/Reshape_output_0", "/blocks.30/input_layernorm/Mul_1_output_0", "/blocks.30/self_attn/q_proj/FakeLinear_output_0", "/blocks.30/self_attn/Shape_output_0", "Shape11240", "Rank11242", "BinaryOp11244", "Unsqueeze11245", "BinaryOp11247", "Unsqueeze11248", "StridedSlice11251", "Squeeze11252", "BinaryOp11254", "/blocks.30/self_attn/Gather_output_0", "/blocks.30/self_attn/Unsqueeze_output_0", "Unsqueeze11262", "Unsqueeze11265", "StridedSlice11268", "Squeeze11269", "BinaryOp11270", "BinaryOp11271", "/blocks.30/self_attn/Gather_1_output_0", "/blocks.30/self_attn/Unsqueeze_1_output_0", "/blocks.30/self_attn/Concat_output_0", "/blocks.30/self_attn/Reshape_output_0", "/blocks.30/self_attn/Mul_output_0", "/blocks.30/self_attn/Shape_2_output_0", "Shape11372", "Rank11374", "BinaryOp11376", "Unsqueeze11377", "BinaryOp11379", "Unsqueeze11380", "StridedSlice11383", "Squeeze11384", "BinaryOp11385", "BinaryOp11386", "/blocks.30/self_attn/Gather_2_output_0", "/blocks.30/self_attn/Div_output_0", "/blocks.30/self_attn/Unsqueeze_7_output_0", "/blocks.30/self_attn/Slice_1_output_0", "/blocks.30/self_attn/Neg_output_0", "/blocks.30/self_attn/Unsqueeze_6_output_0", "/blocks.30/self_attn/Slice_output_0", "/blocks.30/self_attn/Concat_3_output_0", "/blocks.30/self_attn/Mul_1_output_0", "/blocks.30/self_attn/Add_output_0", "/blocks.30/self_attn/k_proj/FakeLinear_output_0", "/blocks.30/self_attn/Unsqueeze_2_output_0", "/blocks.30/self_attn/Unsqueeze_3_output_0", "/blocks.30/self_attn/Concat_1_output_0", "/blocks.30/self_attn/Reshape_1_output_0", "/blocks.30/self_attn/Mul_2_output_0", "/blocks.30/self_attn/Shape_3_output_0", "Shape11278", "Rank11280", "BinaryOp11282", "Unsqueeze11283", "BinaryOp11285", "Unsqueeze11286", "StridedSlice11289", "Squeeze11290", "BinaryOp11291", "BinaryOp11292", "/blocks.30/self_attn/Gather_3_output_0", "/blocks.30/self_attn/Div_1_output_0", "/blocks.30/self_attn/Unsqueeze_9_output_0", "/blocks.30/self_attn/Slice_3_output_0", "/blocks.30/self_attn/Neg_1_output_0", "/blocks.30/self_attn/Unsqueeze_8_output_0", "/blocks.30/self_attn/Slice_2_output_0", "/blocks.30/self_attn/Concat_4_output_0", "/blocks.30/self_attn/Mul_3_output_0", "/blocks.30/self_attn/Add_1_output_0", "/blocks.30/self_attn/v_proj/FakeLinear_output_0", "/blocks.30/self_attn/Unsqueeze_4_output_0", "/blocks.30/self_attn/Unsqueeze_5_output_0", "/blocks.30/self_attn/Concat_2_output_0", "/blocks.30/self_attn/Reshape_2_output_0", "/blocks.30/self_attn/Reshape_7_output_0", "/blocks.30/self_attn/o_proj/FakeLinear_output_0", "/blocks.30/Add_output_0", "/blocks.30/post_attention_layernorm/Mul_1_output_0", "/blocks.30/mlp/gate_proj/FakeLinear_output_0", "/blocks.30/mlp/act_fn/Mul_output_0", "/blocks.30/mlp/up_proj/FakeLinear_output_0", "/blocks.30/mlp/Mul_output_0", "/blocks.30/mlp/down_proj/FakeLinear_output_0", "/blocks.30/Add_1_output_0", "/blocks.31/Reshape_output_0", "/blocks.31/input_layernorm/Mul_1_output_0", "/blocks.31/self_attn/q_proj/FakeLinear_output_0", "/blocks.31/self_attn/Shape_output_0", "Shape11611", "Rank11613", "BinaryOp11615", "Unsqueeze11616", "BinaryOp11618", "Unsqueeze11619", "StridedSlice11622", "Squeeze11623", "BinaryOp11625", "/blocks.31/self_attn/Gather_output_0", "/blocks.31/self_attn/Unsqueeze_output_0", "Unsqueeze11633", "Unsqueeze11636", "StridedSlice11639", "Squeeze11640", "BinaryOp11641", "BinaryOp11642", "/blocks.31/self_attn/Gather_1_output_0", "/blocks.31/self_attn/Unsqueeze_1_output_0", "/blocks.31/self_attn/Concat_output_0", "/blocks.31/self_attn/Reshape_output_0", "/blocks.31/self_attn/Mul_output_0", "/blocks.31/self_attn/Shape_2_output_0", "Shape11712", "Rank11714", "BinaryOp11716", "Unsqueeze11717", "BinaryOp11719", "Unsqueeze11720", "StridedSlice11723", "Squeeze11724", "BinaryOp11725", "BinaryOp11726", "/blocks.31/self_attn/Gather_2_output_0", "/blocks.31/self_attn/Div_output_0", "/blocks.31/self_attn/Unsqueeze_7_output_0", "/blocks.31/self_attn/Slice_1_output_0", "/blocks.31/self_attn/Neg_output_0", "/blocks.31/self_attn/Unsqueeze_6_output_0", "/blocks.31/self_attn/Slice_output_0", "/blocks.31/self_attn/Concat_3_output_0", "/blocks.31/self_attn/Mul_1_output_0", "/blocks.31/self_attn/Add_output_0", "/blocks.31/self_attn/k_proj/FakeLinear_output_0", "/blocks.31/self_attn/Unsqueeze_2_output_0", "/blocks.31/self_attn/Unsqueeze_3_output_0", "/blocks.31/self_attn/Concat_1_output_0", "/blocks.31/self_attn/Reshape_1_output_0", "/blocks.31/self_attn/Mul_2_output_0", "/blocks.31/self_attn/Shape_3_output_0", "Shape11649", "Rank11651", "BinaryOp11653", "Unsqueeze11654", "BinaryOp11656", "Unsqueeze11657", "StridedSlice11660", "Squeeze11661", "BinaryOp11662", "BinaryOp11663", "/blocks.31/self_attn/Gather_3_output_0", "/blocks.31/self_attn/Div_1_output_0", "/blocks.31/self_attn/Unsqueeze_9_output_0", "/blocks.31/self_attn/Slice_3_output_0", "/blocks.31/self_attn/Neg_1_output_0", "/blocks.31/self_attn/Unsqueeze_8_output_0", "/blocks.31/self_attn/Slice_2_output_0", "/blocks.31/self_attn/Concat_4_output_0", "/blocks.31/self_attn/Mul_3_output_0", "/blocks.31/self_attn/Add_1_output_0", "/blocks.31/self_attn/v_proj/FakeLinear_output_0", "/blocks.31/self_attn/Unsqueeze_4_output_0", "/blocks.31/self_attn/Unsqueeze_5_output_0", "/blocks.31/self_attn/Concat_2_output_0", "/blocks.31/self_attn/Reshape_2_output_0", "/blocks.31/self_attn/Reshape_7_output_0", "/blocks.31/self_attn/o_proj/FakeLinear_output_0", "/blocks.31/Add_output_0", "/blocks.31/post_attention_layernorm/Mul_1_output_0", "/blocks.31/mlp/gate_proj/FakeLinear_output_0", "/blocks.31/mlp/act_fn/Mul_output_0", "/blocks.31/mlp/up_proj/FakeLinear_output_0", "/blocks.31/mlp/Mul_output_0", "/blocks.31/mlp/down_proj/FakeLinear_output_0", "/blocks.31/Add_1_output_0", "/Slice_output_0", "hidden_states", "logits", "/layers.0/self_attn/q_proj/Linear/pre_reshape", "/layers.0/self_attn/q_proj/Linear/pre_convert", "/layers.0/self_attn/q_proj/Linear", "/layers.0/self_attn/q_proj/Linear/post_convert", "/layers.0/self_attn/k_proj/Linear/pre_reshape", "/layers.0/self_attn/k_proj/Linear/pre_convert", "/layers.0/self_attn/k_proj/Linear", "/layers.0/self_attn/k_proj/Linear/post_convert", "/layers.0/self_attn/v_proj/Linear/pre_reshape", "/layers.0/self_attn/v_proj/Linear/pre_convert", "/layers.0/self_attn/v_proj/Linear", "/layers.0/self_attn/v_proj/Linear/post_convert", "/layers.0/self_attn/o_proj/Linear/pre_reshape", "/layers.0/self_attn/o_proj/Linear/pre_convert", "/layers.0/self_attn/o_proj/Linear", "/layers.0/self_attn/o_proj/Linear/post_convert", "/layers.0/mlp/gate_proj/Linear/pre_reshape", "/layers.0/mlp/gate_proj/Linear/pre_convert", "/layers.0/mlp/gate_proj/Linear", "/layers.0/mlp/gate_proj/Linear/post_convert", "/layers.0/mlp/up_proj/Linear/pre_reshape", "/layers.0/mlp/up_proj/Linear/pre_convert", "/layers.0/mlp/up_proj/Linear", "/layers.0/mlp/up_proj/Linear/post_convert", "/layers.0/mlp/down_proj/Linear/pre_reshape", "/layers.0/mlp/down_proj/Linear/pre_convert", "/layers.0/mlp/down_proj/Linear", "/layers.0/mlp/down_proj/Linear/post_convert", "/layers.1/self_attn/q_proj/Linear/pre_reshape", "/layers.1/self_attn/q_proj/Linear/pre_convert", "/layers.1/self_attn/q_proj/Linear", "/layers.1/self_attn/q_proj/Linear/post_convert", "/layers.1/self_attn/k_proj/Linear/pre_reshape", "/layers.1/self_attn/k_proj/Linear/pre_convert", "/layers.1/self_attn/k_proj/Linear", "/layers.1/self_attn/k_proj/Linear/post_convert", "/layers.1/self_attn/v_proj/Linear/pre_reshape", "/layers.1/self_attn/v_proj/Linear/pre_convert", "/layers.1/self_attn/v_proj/Linear", "/layers.1/self_attn/v_proj/Linear/post_convert", "/layers.1/self_attn/o_proj/Linear/pre_reshape", "/layers.1/self_attn/o_proj/Linear/pre_convert", "/layers.1/self_attn/o_proj/Linear", "/layers.1/self_attn/o_proj/Linear/post_convert", "/layers.1/mlp/gate_proj/Linear/pre_reshape", "/layers.1/mlp/gate_proj/Linear/pre_convert", "/layers.1/mlp/gate_proj/Linear", "/layers.1/mlp/gate_proj/Linear/post_convert", "/layers.1/mlp/up_proj/Linear/pre_reshape", "/layers.1/mlp/up_proj/Linear/pre_convert", "/layers.1/mlp/up_proj/Linear", "/layers.1/mlp/up_proj/Linear/post_convert", "/layers.1/mlp/down_proj/Linear/pre_reshape", "/layers.1/mlp/down_proj/Linear/pre_convert", "/layers.1/mlp/down_proj/Linear", "/layers.1/mlp/down_proj/Linear/post_convert", "/layers.2/self_attn/q_proj/Linear/pre_reshape", "/layers.2/self_attn/q_proj/Linear/pre_convert", "/layers.2/self_attn/q_proj/Linear", "/layers.2/self_attn/q_proj/Linear/post_convert", "/layers.2/self_attn/k_proj/Linear/pre_reshape", "/layers.2/self_attn/k_proj/Linear/pre_convert", "/layers.2/self_attn/k_proj/Linear", "/layers.2/self_attn/k_proj/Linear/post_convert", "/layers.2/self_attn/v_proj/Linear/pre_reshape", "/layers.2/self_attn/v_proj/Linear/pre_convert", "/layers.2/self_attn/v_proj/Linear", "/layers.2/self_attn/v_proj/Linear/post_convert", "/layers.2/self_attn/o_proj/Linear/pre_reshape", "/layers.2/self_attn/o_proj/Linear/pre_convert", "/layers.2/self_attn/o_proj/Linear", "/layers.2/self_attn/o_proj/Linear/post_convert", "/layers.2/mlp/gate_proj/Linear/pre_reshape", "/layers.2/mlp/gate_proj/Linear/pre_convert", "/layers.2/mlp/gate_proj/Linear", "/layers.2/mlp/gate_proj/Linear/post_convert", "/layers.2/mlp/up_proj/Linear/pre_reshape", "/layers.2/mlp/up_proj/Linear/pre_convert", "/layers.2/mlp/up_proj/Linear", "/layers.2/mlp/up_proj/Linear/post_convert", "/layers.2/mlp/down_proj/Linear/pre_reshape", "/layers.2/mlp/down_proj/Linear/pre_convert", "/layers.2/mlp/down_proj/Linear", "/layers.2/mlp/down_proj/Linear/post_convert", "/layers.3/self_attn/q_proj/Linear/pre_reshape", "/layers.3/self_attn/q_proj/Linear/pre_convert", "/layers.3/self_attn/q_proj/Linear", "/layers.3/self_attn/q_proj/Linear/post_convert", "/layers.3/self_attn/k_proj/Linear/pre_reshape", "/layers.3/self_attn/k_proj/Linear/pre_convert", "/layers.3/self_attn/k_proj/Linear", "/layers.3/self_attn/k_proj/Linear/post_convert", "/layers.3/self_attn/v_proj/Linear/pre_reshape", "/layers.3/self_attn/v_proj/Linear/pre_convert", "/layers.3/self_attn/v_proj/Linear", "/layers.3/self_attn/v_proj/Linear/post_convert", "/layers.3/self_attn/o_proj/Linear/pre_reshape", "/layers.3/self_attn/o_proj/Linear/pre_convert", "/layers.3/self_attn/o_proj/Linear", "/layers.3/self_attn/o_proj/Linear/post_convert", "/layers.3/mlp/gate_proj/Linear/pre_reshape", "/layers.3/mlp/gate_proj/Linear/pre_convert", "/layers.3/mlp/gate_proj/Linear", "/layers.3/mlp/gate_proj/Linear/post_convert", "/layers.3/mlp/up_proj/Linear/pre_reshape", "/layers.3/mlp/up_proj/Linear/pre_convert", "/layers.3/mlp/up_proj/Linear", "/layers.3/mlp/up_proj/Linear/post_convert", "/layers.3/mlp/down_proj/Linear/pre_reshape", "/layers.3/mlp/down_proj/Linear/pre_convert", "/layers.3/mlp/down_proj/Linear", "/layers.3/mlp/down_proj/Linear/post_convert", "/layers.4/self_attn/q_proj/Linear/pre_reshape", "/layers.4/self_attn/q_proj/Linear/pre_convert", "/layers.4/self_attn/q_proj/Linear", "/layers.4/self_attn/q_proj/Linear/post_convert", "/layers.4/self_attn/k_proj/Linear/pre_reshape", "/layers.4/self_attn/k_proj/Linear/pre_convert", "/layers.4/self_attn/k_proj/Linear", "/layers.4/self_attn/k_proj/Linear/post_convert", "/layers.4/self_attn/v_proj/Linear/pre_reshape", "/layers.4/self_attn/v_proj/Linear/pre_convert", "/layers.4/self_attn/v_proj/Linear", "/layers.4/self_attn/v_proj/Linear/post_convert", "/layers.4/self_attn/o_proj/Linear/pre_reshape", "/layers.4/self_attn/o_proj/Linear/pre_convert", "/layers.4/self_attn/o_proj/Linear", "/layers.4/self_attn/o_proj/Linear/post_convert", "/layers.4/mlp/gate_proj/Linear/pre_reshape", "/layers.4/mlp/gate_proj/Linear/pre_convert", "/layers.4/mlp/gate_proj/Linear", "/layers.4/mlp/gate_proj/Linear/post_convert", "/layers.4/mlp/up_proj/Linear/pre_reshape", "/layers.4/mlp/up_proj/Linear/pre_convert", "/layers.4/mlp/up_proj/Linear", "/layers.4/mlp/up_proj/Linear/post_convert", "/layers.4/mlp/down_proj/Linear/pre_reshape", "/layers.4/mlp/down_proj/Linear/pre_convert", "/layers.4/mlp/down_proj/Linear", "/layers.4/mlp/down_proj/Linear/post_convert", "/layers.5/self_attn/q_proj/Linear/pre_reshape", "/layers.5/self_attn/q_proj/Linear/pre_convert", "/layers.5/self_attn/q_proj/Linear", "/layers.5/self_attn/q_proj/Linear/post_convert", "/layers.5/self_attn/k_proj/Linear/pre_reshape", "/layers.5/self_attn/k_proj/Linear/pre_convert", "/layers.5/self_attn/k_proj/Linear", "/layers.5/self_attn/k_proj/Linear/post_convert", "/layers.5/self_attn/v_proj/Linear/pre_reshape", "/layers.5/self_attn/v_proj/Linear/pre_convert", "/layers.5/self_attn/v_proj/Linear", "/layers.5/self_attn/v_proj/Linear/post_convert", "/layers.5/self_attn/o_proj/Linear/pre_reshape", "/layers.5/self_attn/o_proj/Linear/pre_convert", "/layers.5/self_attn/o_proj/Linear", "/layers.5/self_attn/o_proj/Linear/post_convert", "/layers.5/mlp/gate_proj/Linear/pre_reshape", "/layers.5/mlp/gate_proj/Linear/pre_convert", "/layers.5/mlp/gate_proj/Linear", "/layers.5/mlp/gate_proj/Linear/post_convert", "/layers.5/mlp/up_proj/Linear/pre_reshape", "/layers.5/mlp/up_proj/Linear/pre_convert", "/layers.5/mlp/up_proj/Linear", "/layers.5/mlp/up_proj/Linear/post_convert", "/layers.5/mlp/down_proj/Linear/pre_reshape", "/layers.5/mlp/down_proj/Linear/pre_convert", "/layers.5/mlp/down_proj/Linear", "/layers.5/mlp/down_proj/Linear/post_convert", "/layers.6/self_attn/q_proj/Linear/pre_reshape", "/layers.6/self_attn/q_proj/Linear/pre_convert", "/layers.6/self_attn/q_proj/Linear", "/layers.6/self_attn/q_proj/Linear/post_convert", "/layers.6/self_attn/k_proj/Linear/pre_reshape", "/layers.6/self_attn/k_proj/Linear/pre_convert", "/layers.6/self_attn/k_proj/Linear", "/layers.6/self_attn/k_proj/Linear/post_convert", "/layers.6/self_attn/v_proj/Linear/pre_reshape", "/layers.6/self_attn/v_proj/Linear/pre_convert", "/layers.6/self_attn/v_proj/Linear", "/layers.6/self_attn/v_proj/Linear/post_convert", "/layers.6/self_attn/o_proj/Linear/pre_reshape", "/layers.6/self_attn/o_proj/Linear/pre_convert", "/layers.6/self_attn/o_proj/Linear", "/layers.6/self_attn/o_proj/Linear/post_convert", "/layers.6/mlp/gate_proj/Linear/pre_reshape", "/layers.6/mlp/gate_proj/Linear/pre_convert", "/layers.6/mlp/gate_proj/Linear", "/layers.6/mlp/gate_proj/Linear/post_convert", "/layers.6/mlp/up_proj/Linear/pre_reshape", "/layers.6/mlp/up_proj/Linear/pre_convert", "/layers.6/mlp/up_proj/Linear", "/layers.6/mlp/up_proj/Linear/post_convert", "/layers.6/mlp/down_proj/Linear/pre_reshape", "/layers.6/mlp/down_proj/Linear/pre_convert", "/layers.6/mlp/down_proj/Linear", "/layers.6/mlp/down_proj/Linear/post_convert", "/layers.7/self_attn/q_proj/Linear/pre_reshape", "/layers.7/self_attn/q_proj/Linear/pre_convert", "/layers.7/self_attn/q_proj/Linear", "/layers.7/self_attn/q_proj/Linear/post_convert", "/layers.7/self_attn/k_proj/Linear/pre_reshape", "/layers.7/self_attn/k_proj/Linear/pre_convert", "/layers.7/self_attn/k_proj/Linear", "/layers.7/self_attn/k_proj/Linear/post_convert", "/layers.7/self_attn/v_proj/Linear/pre_reshape", "/layers.7/self_attn/v_proj/Linear/pre_convert", "/layers.7/self_attn/v_proj/Linear", "/layers.7/self_attn/v_proj/Linear/post_convert", "/layers.7/self_attn/o_proj/Linear/pre_reshape", "/layers.7/self_attn/o_proj/Linear/pre_convert", "/layers.7/self_attn/o_proj/Linear", "/layers.7/self_attn/o_proj/Linear/post_convert", "/layers.7/mlp/gate_proj/Linear/pre_reshape", "/layers.7/mlp/gate_proj/Linear/pre_convert", "/layers.7/mlp/gate_proj/Linear", "/layers.7/mlp/gate_proj/Linear/post_convert", "/layers.7/mlp/up_proj/Linear/pre_reshape", "/layers.7/mlp/up_proj/Linear/pre_convert", "/layers.7/mlp/up_proj/Linear", "/layers.7/mlp/up_proj/Linear/post_convert", "/layers.7/mlp/down_proj/Linear/pre_reshape", "/layers.7/mlp/down_proj/Linear/pre_convert", "/layers.7/mlp/down_proj/Linear", "/layers.7/mlp/down_proj/Linear/post_convert", "/layers.8/self_attn/q_proj/Linear/pre_reshape", "/layers.8/self_attn/q_proj/Linear/pre_convert", "/layers.8/self_attn/q_proj/Linear", "/layers.8/self_attn/q_proj/Linear/post_convert", "/layers.8/self_attn/k_proj/Linear/pre_reshape", "/layers.8/self_attn/k_proj/Linear/pre_convert", "/layers.8/self_attn/k_proj/Linear", "/layers.8/self_attn/k_proj/Linear/post_convert", "/layers.8/self_attn/v_proj/Linear/pre_reshape", "/layers.8/self_attn/v_proj/Linear/pre_convert", "/layers.8/self_attn/v_proj/Linear", "/layers.8/self_attn/v_proj/Linear/post_convert", "/layers.8/self_attn/o_proj/Linear/pre_reshape", "/layers.8/self_attn/o_proj/Linear/pre_convert", "/layers.8/self_attn/o_proj/Linear", "/layers.8/self_attn/o_proj/Linear/post_convert", "/layers.8/mlp/gate_proj/Linear/pre_reshape", "/layers.8/mlp/gate_proj/Linear/pre_convert", "/layers.8/mlp/gate_proj/Linear", "/layers.8/mlp/gate_proj/Linear/post_convert", "/layers.8/mlp/up_proj/Linear/pre_reshape", "/layers.8/mlp/up_proj/Linear/pre_convert", "/layers.8/mlp/up_proj/Linear", "/layers.8/mlp/up_proj/Linear/post_convert", "/layers.8/mlp/down_proj/Linear/pre_reshape", "/layers.8/mlp/down_proj/Linear/pre_convert", "/layers.8/mlp/down_proj/Linear", "/layers.8/mlp/down_proj/Linear/post_convert", "/layers.9/self_attn/q_proj/Linear/pre_reshape", "/layers.9/self_attn/q_proj/Linear/pre_convert", "/layers.9/self_attn/q_proj/Linear", "/layers.9/self_attn/q_proj/Linear/post_convert", "/layers.9/self_attn/k_proj/Linear/pre_reshape", "/layers.9/self_attn/k_proj/Linear/pre_convert", "/layers.9/self_attn/k_proj/Linear", "/layers.9/self_attn/k_proj/Linear/post_convert", "/layers.9/self_attn/v_proj/Linear/pre_reshape", "/layers.9/self_attn/v_proj/Linear/pre_convert", "/layers.9/self_attn/v_proj/Linear", "/layers.9/self_attn/v_proj/Linear/post_convert", "/layers.9/self_attn/o_proj/Linear/pre_reshape", "/layers.9/self_attn/o_proj/Linear/pre_convert", "/layers.9/self_attn/o_proj/Linear", "/layers.9/self_attn/o_proj/Linear/post_convert", "/layers.9/mlp/gate_proj/Linear/pre_reshape", "/layers.9/mlp/gate_proj/Linear/pre_convert", "/layers.9/mlp/gate_proj/Linear", "/layers.9/mlp/gate_proj/Linear/post_convert", "/layers.9/mlp/up_proj/Linear/pre_reshape", "/layers.9/mlp/up_proj/Linear/pre_convert", "/layers.9/mlp/up_proj/Linear", "/layers.9/mlp/up_proj/Linear/post_convert", "/layers.9/mlp/down_proj/Linear/pre_reshape", "/layers.9/mlp/down_proj/Linear/pre_convert", "/layers.9/mlp/down_proj/Linear", "/layers.9/mlp/down_proj/Linear/post_convert", "/layers.10/self_attn/q_proj/Linear/pre_reshape", "/layers.10/self_attn/q_proj/Linear/pre_convert", "/layers.10/self_attn/q_proj/Linear", "/layers.10/self_attn/q_proj/Linear/post_convert", "/layers.10/self_attn/k_proj/Linear/pre_reshape", "/layers.10/self_attn/k_proj/Linear/pre_convert", "/layers.10/self_attn/k_proj/Linear", "/layers.10/self_attn/k_proj/Linear/post_convert", "/layers.10/self_attn/v_proj/Linear/pre_reshape", "/layers.10/self_attn/v_proj/Linear/pre_convert", "/layers.10/self_attn/v_proj/Linear", "/layers.10/self_attn/v_proj/Linear/post_convert", "/layers.10/self_attn/o_proj/Linear/pre_reshape", "/layers.10/self_attn/o_proj/Linear/pre_convert", "/layers.10/self_attn/o_proj/Linear", "/layers.10/self_attn/o_proj/Linear/post_convert", "/layers.10/mlp/gate_proj/Linear/pre_reshape", "/layers.10/mlp/gate_proj/Linear/pre_convert", "/layers.10/mlp/gate_proj/Linear", "/layers.10/mlp/gate_proj/Linear/post_convert", "/layers.10/mlp/up_proj/Linear/pre_reshape", "/layers.10/mlp/up_proj/Linear/pre_convert", "/layers.10/mlp/up_proj/Linear", "/layers.10/mlp/up_proj/Linear/post_convert", "/layers.10/mlp/down_proj/Linear/pre_reshape", "/layers.10/mlp/down_proj/Linear/pre_convert", "/layers.10/mlp/down_proj/Linear", "/layers.10/mlp/down_proj/Linear/post_convert", "/layers.11/self_attn/q_proj/Linear/pre_reshape", "/layers.11/self_attn/q_proj/Linear/pre_convert", "/layers.11/self_attn/q_proj/Linear", "/layers.11/self_attn/q_proj/Linear/post_convert", "/layers.11/self_attn/k_proj/Linear/pre_reshape", "/layers.11/self_attn/k_proj/Linear/pre_convert", "/layers.11/self_attn/k_proj/Linear", "/layers.11/self_attn/k_proj/Linear/post_convert", "/layers.11/self_attn/v_proj/Linear/pre_reshape", "/layers.11/self_attn/v_proj/Linear/pre_convert", "/layers.11/self_attn/v_proj/Linear", "/layers.11/self_attn/v_proj/Linear/post_convert", "/layers.11/self_attn/o_proj/Linear/pre_reshape", "/layers.11/self_attn/o_proj/Linear/pre_convert", "/layers.11/self_attn/o_proj/Linear", "/layers.11/self_attn/o_proj/Linear/post_convert", "/layers.11/mlp/gate_proj/Linear/pre_reshape", "/layers.11/mlp/gate_proj/Linear/pre_convert", "/layers.11/mlp/gate_proj/Linear", "/layers.11/mlp/gate_proj/Linear/post_convert", "/layers.11/mlp/up_proj/Linear/pre_reshape", "/layers.11/mlp/up_proj/Linear/pre_convert", "/layers.11/mlp/up_proj/Linear", "/layers.11/mlp/up_proj/Linear/post_convert", "/layers.11/mlp/down_proj/Linear/pre_reshape", "/layers.11/mlp/down_proj/Linear/pre_convert", "/layers.11/mlp/down_proj/Linear", "/layers.11/mlp/down_proj/Linear/post_convert", "/layers.12/self_attn/q_proj/Linear/pre_reshape", "/layers.12/self_attn/q_proj/Linear/pre_convert", "/layers.12/self_attn/q_proj/Linear", "/layers.12/self_attn/q_proj/Linear/post_convert", "/layers.12/self_attn/k_proj/Linear/pre_reshape", "/layers.12/self_attn/k_proj/Linear/pre_convert", "/layers.12/self_attn/k_proj/Linear", "/layers.12/self_attn/k_proj/Linear/post_convert", "/layers.12/self_attn/v_proj/Linear/pre_reshape", "/layers.12/self_attn/v_proj/Linear/pre_convert", "/layers.12/self_attn/v_proj/Linear", "/layers.12/self_attn/v_proj/Linear/post_convert", "/layers.12/self_attn/o_proj/Linear/pre_reshape", "/layers.12/self_attn/o_proj/Linear/pre_convert", "/layers.12/self_attn/o_proj/Linear", "/layers.12/self_attn/o_proj/Linear/post_convert", "/layers.12/mlp/gate_proj/Linear/pre_reshape", "/layers.12/mlp/gate_proj/Linear/pre_convert", "/layers.12/mlp/gate_proj/Linear", "/layers.12/mlp/gate_proj/Linear/post_convert", "/layers.12/mlp/up_proj/Linear/pre_reshape", "/layers.12/mlp/up_proj/Linear/pre_convert", "/layers.12/mlp/up_proj/Linear", "/layers.12/mlp/up_proj/Linear/post_convert", "/layers.12/mlp/down_proj/Linear/pre_reshape", "/layers.12/mlp/down_proj/Linear/pre_convert", "/layers.12/mlp/down_proj/Linear", "/layers.12/mlp/down_proj/Linear/post_convert", "/layers.13/self_attn/q_proj/Linear/pre_reshape", "/layers.13/self_attn/q_proj/Linear/pre_convert", "/layers.13/self_attn/q_proj/Linear", "/layers.13/self_attn/q_proj/Linear/post_convert", "/layers.13/self_attn/k_proj/Linear/pre_reshape", "/layers.13/self_attn/k_proj/Linear/pre_convert", "/layers.13/self_attn/k_proj/Linear", "/layers.13/self_attn/k_proj/Linear/post_convert", "/layers.13/self_attn/v_proj/Linear/pre_reshape", "/layers.13/self_attn/v_proj/Linear/pre_convert", "/layers.13/self_attn/v_proj/Linear", "/layers.13/self_attn/v_proj/Linear/post_convert", "/layers.13/self_attn/o_proj/Linear/pre_reshape", "/layers.13/self_attn/o_proj/Linear/pre_convert", "/layers.13/self_attn/o_proj/Linear", "/layers.13/self_attn/o_proj/Linear/post_convert", "/layers.13/mlp/gate_proj/Linear/pre_reshape", "/layers.13/mlp/gate_proj/Linear/pre_convert", "/layers.13/mlp/gate_proj/Linear", "/layers.13/mlp/gate_proj/Linear/post_convert", "/layers.13/mlp/up_proj/Linear/pre_reshape", "/layers.13/mlp/up_proj/Linear/pre_convert", "/layers.13/mlp/up_proj/Linear", "/layers.13/mlp/up_proj/Linear/post_convert", "/layers.13/mlp/down_proj/Linear/pre_reshape", "/layers.13/mlp/down_proj/Linear/pre_convert", "/layers.13/mlp/down_proj/Linear", "/layers.13/mlp/down_proj/Linear/post_convert", "/layers.14/self_attn/q_proj/Linear/pre_reshape", "/layers.14/self_attn/q_proj/Linear/pre_convert", "/layers.14/self_attn/q_proj/Linear", "/layers.14/self_attn/q_proj/Linear/post_convert", "/layers.14/self_attn/k_proj/Linear/pre_reshape", "/layers.14/self_attn/k_proj/Linear/pre_convert", "/layers.14/self_attn/k_proj/Linear", "/layers.14/self_attn/k_proj/Linear/post_convert", "/layers.14/self_attn/v_proj/Linear/pre_reshape", "/layers.14/self_attn/v_proj/Linear/pre_convert", "/layers.14/self_attn/v_proj/Linear", "/layers.14/self_attn/v_proj/Linear/post_convert", "/layers.14/self_attn/o_proj/Linear/pre_reshape", "/layers.14/self_attn/o_proj/Linear/pre_convert", "/layers.14/self_attn/o_proj/Linear", "/layers.14/self_attn/o_proj/Linear/post_convert", "/layers.14/mlp/gate_proj/Linear/pre_reshape", "/layers.14/mlp/gate_proj/Linear/pre_convert", "/layers.14/mlp/gate_proj/Linear", "/layers.14/mlp/gate_proj/Linear/post_convert", "/layers.14/mlp/up_proj/Linear/pre_reshape", "/layers.14/mlp/up_proj/Linear/pre_convert", "/layers.14/mlp/up_proj/Linear", "/layers.14/mlp/up_proj/Linear/post_convert", "/layers.14/mlp/down_proj/Linear/pre_reshape", "/layers.14/mlp/down_proj/Linear/pre_convert", "/layers.14/mlp/down_proj/Linear", "/layers.14/mlp/down_proj/Linear/post_convert", "/layers.15/self_attn/q_proj/Linear/pre_reshape", "/layers.15/self_attn/q_proj/Linear/pre_convert", "/layers.15/self_attn/q_proj/Linear", "/layers.15/self_attn/q_proj/Linear/post_convert", "/layers.15/self_attn/k_proj/Linear/pre_reshape", "/layers.15/self_attn/k_proj/Linear/pre_convert", "/layers.15/self_attn/k_proj/Linear", "/layers.15/self_attn/k_proj/Linear/post_convert", "/layers.15/self_attn/v_proj/Linear/pre_reshape", "/layers.15/self_attn/v_proj/Linear/pre_convert", "/layers.15/self_attn/v_proj/Linear", "/layers.15/self_attn/v_proj/Linear/post_convert", "/layers.15/self_attn/o_proj/Linear/pre_reshape", "/layers.15/self_attn/o_proj/Linear/pre_convert", "/layers.15/self_attn/o_proj/Linear", "/layers.15/self_attn/o_proj/Linear/post_convert", "/layers.15/mlp/gate_proj/Linear/pre_reshape", "/layers.15/mlp/gate_proj/Linear/pre_convert", "/layers.15/mlp/gate_proj/Linear", "/layers.15/mlp/gate_proj/Linear/post_convert", "/layers.15/mlp/up_proj/Linear/pre_reshape", "/layers.15/mlp/up_proj/Linear/pre_convert", "/layers.15/mlp/up_proj/Linear", "/layers.15/mlp/up_proj/Linear/post_convert", "/layers.15/mlp/down_proj/Linear/pre_reshape", "/layers.15/mlp/down_proj/Linear/pre_convert", "/layers.15/mlp/down_proj/Linear", "/layers.15/mlp/down_proj/Linear/post_convert", "/layers.16/self_attn/q_proj/Linear/pre_reshape", "/layers.16/self_attn/q_proj/Linear/pre_convert", "/layers.16/self_attn/q_proj/Linear", "/layers.16/self_attn/q_proj/Linear/post_convert", "/layers.16/self_attn/k_proj/Linear/pre_reshape", "/layers.16/self_attn/k_proj/Linear/pre_convert", "/layers.16/self_attn/k_proj/Linear", "/layers.16/self_attn/k_proj/Linear/post_convert", "/layers.16/self_attn/v_proj/Linear/pre_reshape", "/layers.16/self_attn/v_proj/Linear/pre_convert", "/layers.16/self_attn/v_proj/Linear", "/layers.16/self_attn/v_proj/Linear/post_convert", "/layers.16/self_attn/o_proj/Linear/pre_reshape", "/layers.16/self_attn/o_proj/Linear/pre_convert", "/layers.16/self_attn/o_proj/Linear", "/layers.16/self_attn/o_proj/Linear/post_convert", "/layers.16/mlp/gate_proj/Linear/pre_reshape", "/layers.16/mlp/gate_proj/Linear/pre_convert", "/layers.16/mlp/gate_proj/Linear", "/layers.16/mlp/gate_proj/Linear/post_convert", "/layers.16/mlp/up_proj/Linear/pre_reshape", "/layers.16/mlp/up_proj/Linear/pre_convert", "/layers.16/mlp/up_proj/Linear", "/layers.16/mlp/up_proj/Linear/post_convert", "/layers.16/mlp/down_proj/Linear/pre_reshape", "/layers.16/mlp/down_proj/Linear/pre_convert", "/layers.16/mlp/down_proj/Linear", "/layers.16/mlp/down_proj/Linear/post_convert", "/layers.17/self_attn/q_proj/Linear/pre_reshape", "/layers.17/self_attn/q_proj/Linear/pre_convert", "/layers.17/self_attn/q_proj/Linear", "/layers.17/self_attn/q_proj/Linear/post_convert", "/layers.17/self_attn/k_proj/Linear/pre_reshape", "/layers.17/self_attn/k_proj/Linear/pre_convert", "/layers.17/self_attn/k_proj/Linear", "/layers.17/self_attn/k_proj/Linear/post_convert", "/layers.17/self_attn/v_proj/Linear/pre_reshape", "/layers.17/self_attn/v_proj/Linear/pre_convert", "/layers.17/self_attn/v_proj/Linear", "/layers.17/self_attn/v_proj/Linear/post_convert", "/layers.17/self_attn/o_proj/Linear/pre_reshape", "/layers.17/self_attn/o_proj/Linear/pre_convert", "/layers.17/self_attn/o_proj/Linear", "/layers.17/self_attn/o_proj/Linear/post_convert", "/layers.17/mlp/gate_proj/Linear/pre_reshape", "/layers.17/mlp/gate_proj/Linear/pre_convert", "/layers.17/mlp/gate_proj/Linear", "/layers.17/mlp/gate_proj/Linear/post_convert", "/layers.17/mlp/up_proj/Linear/pre_reshape", "/layers.17/mlp/up_proj/Linear/pre_convert", "/layers.17/mlp/up_proj/Linear", "/layers.17/mlp/up_proj/Linear/post_convert", "/layers.17/mlp/down_proj/Linear/pre_reshape", "/layers.17/mlp/down_proj/Linear/pre_convert", "/layers.17/mlp/down_proj/Linear", "/layers.17/mlp/down_proj/Linear/post_convert", "/layers.18/self_attn/q_proj/Linear/pre_reshape", "/layers.18/self_attn/q_proj/Linear/pre_convert", "/layers.18/self_attn/q_proj/Linear", "/layers.18/self_attn/q_proj/Linear/post_convert", "/layers.18/self_attn/k_proj/Linear/pre_reshape", "/layers.18/self_attn/k_proj/Linear/pre_convert", "/layers.18/self_attn/k_proj/Linear", "/layers.18/self_attn/k_proj/Linear/post_convert", "/layers.18/self_attn/v_proj/Linear/pre_reshape", "/layers.18/self_attn/v_proj/Linear/pre_convert", "/layers.18/self_attn/v_proj/Linear", "/layers.18/self_attn/v_proj/Linear/post_convert", "/layers.18/self_attn/o_proj/Linear/pre_reshape", "/layers.18/self_attn/o_proj/Linear/pre_convert", "/layers.18/self_attn/o_proj/Linear", "/layers.18/self_attn/o_proj/Linear/post_convert", "/layers.18/mlp/gate_proj/Linear/pre_reshape", "/layers.18/mlp/gate_proj/Linear/pre_convert", "/layers.18/mlp/gate_proj/Linear", "/layers.18/mlp/gate_proj/Linear/post_convert", "/layers.18/mlp/up_proj/Linear/pre_reshape", "/layers.18/mlp/up_proj/Linear/pre_convert", "/layers.18/mlp/up_proj/Linear", "/layers.18/mlp/up_proj/Linear/post_convert", "/layers.18/mlp/down_proj/Linear/pre_reshape", "/layers.18/mlp/down_proj/Linear/pre_convert", "/layers.18/mlp/down_proj/Linear", "/layers.18/mlp/down_proj/Linear/post_convert", "/layers.19/self_attn/q_proj/Linear/pre_reshape", "/layers.19/self_attn/q_proj/Linear/pre_convert", "/layers.19/self_attn/q_proj/Linear", "/layers.19/self_attn/q_proj/Linear/post_convert", "/layers.19/self_attn/k_proj/Linear/pre_reshape", "/layers.19/self_attn/k_proj/Linear/pre_convert", "/layers.19/self_attn/k_proj/Linear", "/layers.19/self_attn/k_proj/Linear/post_convert", "/layers.19/self_attn/v_proj/Linear/pre_reshape", "/layers.19/self_attn/v_proj/Linear/pre_convert", "/layers.19/self_attn/v_proj/Linear", "/layers.19/self_attn/v_proj/Linear/post_convert", "/layers.19/self_attn/o_proj/Linear/pre_reshape", "/layers.19/self_attn/o_proj/Linear/pre_convert", "/layers.19/self_attn/o_proj/Linear", "/layers.19/self_attn/o_proj/Linear/post_convert", "/layers.19/mlp/gate_proj/Linear/pre_reshape", "/layers.19/mlp/gate_proj/Linear/pre_convert", "/layers.19/mlp/gate_proj/Linear", "/layers.19/mlp/gate_proj/Linear/post_convert", "/layers.19/mlp/up_proj/Linear/pre_reshape", "/layers.19/mlp/up_proj/Linear/pre_convert", "/layers.19/mlp/up_proj/Linear", "/layers.19/mlp/up_proj/Linear/post_convert", "/layers.19/mlp/down_proj/Linear/pre_reshape", "/layers.19/mlp/down_proj/Linear/pre_convert", "/layers.19/mlp/down_proj/Linear", "/layers.19/mlp/down_proj/Linear/post_convert", "/layers.20/self_attn/q_proj/Linear/pre_reshape", "/layers.20/self_attn/q_proj/Linear/pre_convert", "/layers.20/self_attn/q_proj/Linear", "/layers.20/self_attn/q_proj/Linear/post_convert", "/layers.20/self_attn/k_proj/Linear/pre_reshape", "/layers.20/self_attn/k_proj/Linear/pre_convert", "/layers.20/self_attn/k_proj/Linear", "/layers.20/self_attn/k_proj/Linear/post_convert", "/layers.20/self_attn/v_proj/Linear/pre_reshape", "/layers.20/self_attn/v_proj/Linear/pre_convert", "/layers.20/self_attn/v_proj/Linear", "/layers.20/self_attn/v_proj/Linear/post_convert", "/layers.20/self_attn/o_proj/Linear/pre_reshape", "/layers.20/self_attn/o_proj/Linear/pre_convert", "/layers.20/self_attn/o_proj/Linear", "/layers.20/self_attn/o_proj/Linear/post_convert", "/layers.20/mlp/gate_proj/Linear/pre_reshape", "/layers.20/mlp/gate_proj/Linear/pre_convert", "/layers.20/mlp/gate_proj/Linear", "/layers.20/mlp/gate_proj/Linear/post_convert", "/layers.20/mlp/up_proj/Linear/pre_reshape", "/layers.20/mlp/up_proj/Linear/pre_convert", "/layers.20/mlp/up_proj/Linear", "/layers.20/mlp/up_proj/Linear/post_convert", "/layers.20/mlp/down_proj/Linear/pre_reshape", "/layers.20/mlp/down_proj/Linear/pre_convert", "/layers.20/mlp/down_proj/Linear", "/layers.20/mlp/down_proj/Linear/post_convert", "/layers.21/self_attn/q_proj/Linear/pre_reshape", "/layers.21/self_attn/q_proj/Linear/pre_convert", "/layers.21/self_attn/q_proj/Linear", "/layers.21/self_attn/q_proj/Linear/post_convert", "/layers.21/self_attn/k_proj/Linear/pre_reshape", "/layers.21/self_attn/k_proj/Linear/pre_convert", "/layers.21/self_attn/k_proj/Linear", "/layers.21/self_attn/k_proj/Linear/post_convert", "/layers.21/self_attn/v_proj/Linear/pre_reshape", "/layers.21/self_attn/v_proj/Linear/pre_convert", "/layers.21/self_attn/v_proj/Linear", "/layers.21/self_attn/v_proj/Linear/post_convert", "/layers.21/self_attn/o_proj/Linear/pre_reshape", "/layers.21/self_attn/o_proj/Linear/pre_convert", "/layers.21/self_attn/o_proj/Linear", "/layers.21/self_attn/o_proj/Linear/post_convert", "/layers.21/mlp/gate_proj/Linear/pre_reshape", "/layers.21/mlp/gate_proj/Linear/pre_convert", "/layers.21/mlp/gate_proj/Linear", "/layers.21/mlp/gate_proj/Linear/post_convert", "/layers.21/mlp/up_proj/Linear/pre_reshape", "/layers.21/mlp/up_proj/Linear/pre_convert", "/layers.21/mlp/up_proj/Linear", "/layers.21/mlp/up_proj/Linear/post_convert", "/layers.21/mlp/down_proj/Linear/pre_reshape", "/layers.21/mlp/down_proj/Linear/pre_convert", "/layers.21/mlp/down_proj/Linear", "/layers.21/mlp/down_proj/Linear/post_convert", "/layers.22/self_attn/q_proj/Linear/pre_reshape", "/layers.22/self_attn/q_proj/Linear/pre_convert", "/layers.22/self_attn/q_proj/Linear", "/layers.22/self_attn/q_proj/Linear/post_convert", "/layers.22/self_attn/k_proj/Linear/pre_reshape", "/layers.22/self_attn/k_proj/Linear/pre_convert", "/layers.22/self_attn/k_proj/Linear", "/layers.22/self_attn/k_proj/Linear/post_convert", "/layers.22/self_attn/v_proj/Linear/pre_reshape", "/layers.22/self_attn/v_proj/Linear/pre_convert", "/layers.22/self_attn/v_proj/Linear", "/layers.22/self_attn/v_proj/Linear/post_convert", "/layers.22/self_attn/o_proj/Linear/pre_reshape", "/layers.22/self_attn/o_proj/Linear/pre_convert", "/layers.22/self_attn/o_proj/Linear", "/layers.22/self_attn/o_proj/Linear/post_convert", "/layers.22/mlp/gate_proj/Linear/pre_reshape", "/layers.22/mlp/gate_proj/Linear/pre_convert", "/layers.22/mlp/gate_proj/Linear", "/layers.22/mlp/gate_proj/Linear/post_convert", "/layers.22/mlp/up_proj/Linear/pre_reshape", "/layers.22/mlp/up_proj/Linear/pre_convert", "/layers.22/mlp/up_proj/Linear", "/layers.22/mlp/up_proj/Linear/post_convert", "/layers.22/mlp/down_proj/Linear/pre_reshape", "/layers.22/mlp/down_proj/Linear/pre_convert", "/layers.22/mlp/down_proj/Linear", "/layers.22/mlp/down_proj/Linear/post_convert", "/layers.23/self_attn/q_proj/Linear/pre_reshape", "/layers.23/self_attn/q_proj/Linear/pre_convert", "/layers.23/self_attn/q_proj/Linear", "/layers.23/self_attn/q_proj/Linear/post_convert", "/layers.23/self_attn/k_proj/Linear/pre_reshape", "/layers.23/self_attn/k_proj/Linear/pre_convert", "/layers.23/self_attn/k_proj/Linear", "/layers.23/self_attn/k_proj/Linear/post_convert", "/layers.23/self_attn/v_proj/Linear/pre_reshape", "/layers.23/self_attn/v_proj/Linear/pre_convert", "/layers.23/self_attn/v_proj/Linear", "/layers.23/self_attn/v_proj/Linear/post_convert", "/layers.23/self_attn/o_proj/Linear/pre_reshape", "/layers.23/self_attn/o_proj/Linear/pre_convert", "/layers.23/self_attn/o_proj/Linear", "/layers.23/self_attn/o_proj/Linear/post_convert", "/layers.23/mlp/gate_proj/Linear/pre_reshape", "/layers.23/mlp/gate_proj/Linear/pre_convert", "/layers.23/mlp/gate_proj/Linear", "/layers.23/mlp/gate_proj/Linear/post_convert", "/layers.23/mlp/up_proj/Linear/pre_reshape", "/layers.23/mlp/up_proj/Linear/pre_convert", "/layers.23/mlp/up_proj/Linear", "/layers.23/mlp/up_proj/Linear/post_convert", "/layers.23/mlp/down_proj/Linear/pre_reshape", "/layers.23/mlp/down_proj/Linear/pre_convert", "/layers.23/mlp/down_proj/Linear", "/layers.23/mlp/down_proj/Linear/post_convert", "/layers.24/self_attn/q_proj/Linear/pre_reshape", "/layers.24/self_attn/q_proj/Linear/pre_convert", "/layers.24/self_attn/q_proj/Linear", "/layers.24/self_attn/q_proj/Linear/post_convert", "/layers.24/self_attn/k_proj/Linear/pre_reshape", "/layers.24/self_attn/k_proj/Linear/pre_convert", "/layers.24/self_attn/k_proj/Linear", "/layers.24/self_attn/k_proj/Linear/post_convert", "/layers.24/self_attn/v_proj/Linear/pre_reshape", "/layers.24/self_attn/v_proj/Linear/pre_convert", "/layers.24/self_attn/v_proj/Linear", "/layers.24/self_attn/v_proj/Linear/post_convert", "/layers.24/self_attn/o_proj/Linear/pre_reshape", "/layers.24/self_attn/o_proj/Linear/pre_convert", "/layers.24/self_attn/o_proj/Linear", "/layers.24/self_attn/o_proj/Linear/post_convert", "/layers.24/mlp/gate_proj/Linear/pre_reshape", "/layers.24/mlp/gate_proj/Linear/pre_convert", "/layers.24/mlp/gate_proj/Linear", "/layers.24/mlp/gate_proj/Linear/post_convert", "/layers.24/mlp/up_proj/Linear/pre_reshape", "/layers.24/mlp/up_proj/Linear/pre_convert", "/layers.24/mlp/up_proj/Linear", "/layers.24/mlp/up_proj/Linear/post_convert", "/layers.24/mlp/down_proj/Linear/pre_reshape", "/layers.24/mlp/down_proj/Linear/pre_convert", "/layers.24/mlp/down_proj/Linear", "/layers.24/mlp/down_proj/Linear/post_convert", "/layers.25/self_attn/q_proj/Linear/pre_reshape", "/layers.25/self_attn/q_proj/Linear/pre_convert", "/layers.25/self_attn/q_proj/Linear", "/layers.25/self_attn/q_proj/Linear/post_convert", "/layers.25/self_attn/k_proj/Linear/pre_reshape", "/layers.25/self_attn/k_proj/Linear/pre_convert", "/layers.25/self_attn/k_proj/Linear", "/layers.25/self_attn/k_proj/Linear/post_convert", "/layers.25/self_attn/v_proj/Linear/pre_reshape", "/layers.25/self_attn/v_proj/Linear/pre_convert", "/layers.25/self_attn/v_proj/Linear", "/layers.25/self_attn/v_proj/Linear/post_convert", "/layers.25/self_attn/o_proj/Linear/pre_reshape", "/layers.25/self_attn/o_proj/Linear/pre_convert", "/layers.25/self_attn/o_proj/Linear", "/layers.25/self_attn/o_proj/Linear/post_convert", "/layers.25/mlp/gate_proj/Linear/pre_reshape", "/layers.25/mlp/gate_proj/Linear/pre_convert", "/layers.25/mlp/gate_proj/Linear", "/layers.25/mlp/gate_proj/Linear/post_convert", "/layers.25/mlp/up_proj/Linear/pre_reshape", "/layers.25/mlp/up_proj/Linear/pre_convert", "/layers.25/mlp/up_proj/Linear", "/layers.25/mlp/up_proj/Linear/post_convert", "/layers.25/mlp/down_proj/Linear/pre_reshape", "/layers.25/mlp/down_proj/Linear/pre_convert", "/layers.25/mlp/down_proj/Linear", "/layers.25/mlp/down_proj/Linear/post_convert", "/layers.26/self_attn/q_proj/Linear/pre_reshape", "/layers.26/self_attn/q_proj/Linear/pre_convert", "/layers.26/self_attn/q_proj/Linear", "/layers.26/self_attn/q_proj/Linear/post_convert", "/layers.26/self_attn/k_proj/Linear/pre_reshape", "/layers.26/self_attn/k_proj/Linear/pre_convert", "/layers.26/self_attn/k_proj/Linear", "/layers.26/self_attn/k_proj/Linear/post_convert", "/layers.26/self_attn/v_proj/Linear/pre_reshape", "/layers.26/self_attn/v_proj/Linear/pre_convert", "/layers.26/self_attn/v_proj/Linear", "/layers.26/self_attn/v_proj/Linear/post_convert", "/layers.26/self_attn/o_proj/Linear/pre_reshape", "/layers.26/self_attn/o_proj/Linear/pre_convert", "/layers.26/self_attn/o_proj/Linear", "/layers.26/self_attn/o_proj/Linear/post_convert", "/layers.26/mlp/gate_proj/Linear/pre_reshape", "/layers.26/mlp/gate_proj/Linear/pre_convert", "/layers.26/mlp/gate_proj/Linear", "/layers.26/mlp/gate_proj/Linear/post_convert", "/layers.26/mlp/up_proj/Linear/pre_reshape", "/layers.26/mlp/up_proj/Linear/pre_convert", "/layers.26/mlp/up_proj/Linear", "/layers.26/mlp/up_proj/Linear/post_convert", "/layers.26/mlp/down_proj/Linear/pre_reshape", "/layers.26/mlp/down_proj/Linear/pre_convert", "/layers.26/mlp/down_proj/Linear", "/layers.26/mlp/down_proj/Linear/post_convert", "/layers.27/self_attn/q_proj/Linear/pre_reshape", "/layers.27/self_attn/q_proj/Linear/pre_convert", "/layers.27/self_attn/q_proj/Linear", "/layers.27/self_attn/q_proj/Linear/post_convert", "/layers.27/self_attn/k_proj/Linear/pre_reshape", "/layers.27/self_attn/k_proj/Linear/pre_convert", "/layers.27/self_attn/k_proj/Linear", "/layers.27/self_attn/k_proj/Linear/post_convert", "/layers.27/self_attn/v_proj/Linear/pre_reshape", "/layers.27/self_attn/v_proj/Linear/pre_convert", "/layers.27/self_attn/v_proj/Linear", "/layers.27/self_attn/v_proj/Linear/post_convert", "/layers.27/self_attn/o_proj/Linear/pre_reshape", "/layers.27/self_attn/o_proj/Linear/pre_convert", "/layers.27/self_attn/o_proj/Linear", "/layers.27/self_attn/o_proj/Linear/post_convert", "/layers.27/mlp/gate_proj/Linear/pre_reshape", "/layers.27/mlp/gate_proj/Linear/pre_convert", "/layers.27/mlp/gate_proj/Linear", "/layers.27/mlp/gate_proj/Linear/post_convert", "/layers.27/mlp/up_proj/Linear/pre_reshape", "/layers.27/mlp/up_proj/Linear/pre_convert", "/layers.27/mlp/up_proj/Linear", "/layers.27/mlp/up_proj/Linear/post_convert", "/layers.27/mlp/down_proj/Linear/pre_reshape", "/layers.27/mlp/down_proj/Linear/pre_convert", "/layers.27/mlp/down_proj/Linear", "/layers.27/mlp/down_proj/Linear/post_convert", "/layers.28/self_attn/q_proj/Linear/pre_reshape", "/layers.28/self_attn/q_proj/Linear/pre_convert", "/layers.28/self_attn/q_proj/Linear", "/layers.28/self_attn/q_proj/Linear/post_convert", "/layers.28/self_attn/k_proj/Linear/pre_reshape", "/layers.28/self_attn/k_proj/Linear/pre_convert", "/layers.28/self_attn/k_proj/Linear", "/layers.28/self_attn/k_proj/Linear/post_convert", "/layers.28/self_attn/v_proj/Linear/pre_reshape", "/layers.28/self_attn/v_proj/Linear/pre_convert", "/layers.28/self_attn/v_proj/Linear", "/layers.28/self_attn/v_proj/Linear/post_convert", "/layers.28/self_attn/o_proj/Linear/pre_reshape", "/layers.28/self_attn/o_proj/Linear/pre_convert", "/layers.28/self_attn/o_proj/Linear", "/layers.28/self_attn/o_proj/Linear/post_convert", "/layers.28/mlp/gate_proj/Linear/pre_reshape", "/layers.28/mlp/gate_proj/Linear/pre_convert", "/layers.28/mlp/gate_proj/Linear", "/layers.28/mlp/gate_proj/Linear/post_convert", "/layers.28/mlp/up_proj/Linear/pre_reshape", "/layers.28/mlp/up_proj/Linear/pre_convert", "/layers.28/mlp/up_proj/Linear", "/layers.28/mlp/up_proj/Linear/post_convert", "/layers.28/mlp/down_proj/Linear/pre_reshape", "/layers.28/mlp/down_proj/Linear/pre_convert", "/layers.28/mlp/down_proj/Linear", "/layers.28/mlp/down_proj/Linear/post_convert", "/layers.29/self_attn/q_proj/Linear/pre_reshape", "/layers.29/self_attn/q_proj/Linear/pre_convert", "/layers.29/self_attn/q_proj/Linear", "/layers.29/self_attn/q_proj/Linear/post_convert", "/layers.29/self_attn/k_proj/Linear/pre_reshape", "/layers.29/self_attn/k_proj/Linear/pre_convert", "/layers.29/self_attn/k_proj/Linear", "/layers.29/self_attn/k_proj/Linear/post_convert", "/layers.29/self_attn/v_proj/Linear/pre_reshape", "/layers.29/self_attn/v_proj/Linear/pre_convert", "/layers.29/self_attn/v_proj/Linear", "/layers.29/self_attn/v_proj/Linear/post_convert", "/layers.29/self_attn/o_proj/Linear/pre_reshape", "/layers.29/self_attn/o_proj/Linear/pre_convert", "/layers.29/self_attn/o_proj/Linear", "/layers.29/self_attn/o_proj/Linear/post_convert", "/layers.29/mlp/gate_proj/Linear/pre_reshape", "/layers.29/mlp/gate_proj/Linear/pre_convert", "/layers.29/mlp/gate_proj/Linear", "/layers.29/mlp/gate_proj/Linear/post_convert", "/layers.29/mlp/up_proj/Linear/pre_reshape", "/layers.29/mlp/up_proj/Linear/pre_convert", "/layers.29/mlp/up_proj/Linear", "/layers.29/mlp/up_proj/Linear/post_convert", "/layers.29/mlp/down_proj/Linear/pre_reshape", "/layers.29/mlp/down_proj/Linear/pre_convert", "/layers.29/mlp/down_proj/Linear", "/layers.29/mlp/down_proj/Linear/post_convert", "/layers.30/self_attn/q_proj/Linear/pre_reshape", "/layers.30/self_attn/q_proj/Linear/pre_convert", "/layers.30/self_attn/q_proj/Linear", "/layers.30/self_attn/q_proj/Linear/post_convert", "/layers.30/self_attn/k_proj/Linear/pre_reshape", "/layers.30/self_attn/k_proj/Linear/pre_convert", "/layers.30/self_attn/k_proj/Linear", "/layers.30/self_attn/k_proj/Linear/post_convert", "/layers.30/self_attn/v_proj/Linear/pre_reshape", "/layers.30/self_attn/v_proj/Linear/pre_convert", "/layers.30/self_attn/v_proj/Linear", "/layers.30/self_attn/v_proj/Linear/post_convert", "/layers.30/self_attn/o_proj/Linear/pre_reshape", "/layers.30/self_attn/o_proj/Linear/pre_convert", "/layers.30/self_attn/o_proj/Linear", "/layers.30/self_attn/o_proj/Linear/post_convert", "/layers.30/mlp/gate_proj/Linear/pre_reshape", "/layers.30/mlp/gate_proj/Linear/pre_convert", "/layers.30/mlp/gate_proj/Linear", "/layers.30/mlp/gate_proj/Linear/post_convert", "/layers.30/mlp/up_proj/Linear/pre_reshape", "/layers.30/mlp/up_proj/Linear/pre_convert", "/layers.30/mlp/up_proj/Linear", "/layers.30/mlp/up_proj/Linear/post_convert", "/layers.30/mlp/down_proj/Linear/pre_reshape", "/layers.30/mlp/down_proj/Linear/pre_convert", "/layers.30/mlp/down_proj/Linear", "/layers.30/mlp/down_proj/Linear/post_convert", "/layers.31/self_attn/q_proj/Linear/pre_reshape", "/layers.31/self_attn/q_proj/Linear/pre_convert", "/layers.31/self_attn/q_proj/Linear", "/layers.31/self_attn/q_proj/Linear/post_convert", "/layers.31/self_attn/k_proj/Linear/pre_reshape", "/layers.31/self_attn/k_proj/Linear/pre_convert", "/layers.31/self_attn/k_proj/Linear", "/layers.31/self_attn/k_proj/Linear/post_convert", "/layers.31/self_attn/v_proj/Linear/pre_reshape", "/layers.31/self_attn/v_proj/Linear/pre_convert", "/layers.31/self_attn/v_proj/Linear", "/layers.31/self_attn/v_proj/Linear/post_convert", "/layers.31/self_attn/o_proj/Linear/pre_reshape", "/layers.31/self_attn/o_proj/Linear/pre_convert", "/layers.31/self_attn/o_proj/Linear", "/layers.31/self_attn/o_proj/Linear/post_convert", "/layers.31/mlp/gate_proj/Linear/pre_reshape", "/layers.31/mlp/gate_proj/Linear/pre_convert", "/layers.31/mlp/gate_proj/Linear", "/layers.31/mlp/gate_proj/Linear/post_convert", "/layers.31/mlp/up_proj/Linear/pre_reshape", "/layers.31/mlp/up_proj/Linear/pre_convert", "/layers.31/mlp/up_proj/Linear", "/layers.31/mlp/up_proj/Linear/post_convert", "/layers.31/mlp/down_proj/Linear/pre_reshape", "/layers.31/mlp/down_proj/Linear/pre_convert", "/layers.31/mlp/down_proj/Linear", "/layers.31/mlp/down_proj/Linear/post_convert", "/lm/lm_head/Linear/pre_reshape", "/lm/lm_head/Linear/pre_convert", "/lm/lm_head/Linear", "/lm/lm_head/Linear/post_convert" ] , "tensorNumber": 0, "usage": "INFERENCE", "mnn_uuid": "fad150ff-c08c-4af6-8db0-91b1fc602450" }