{ "bizCode": "MNNTest", "extraInfo": { "version": "3.2.5" } , "oplists": [ { "main_type": "Input", "main": { "dims": [ 1, 1, 4096 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "input_ids", "outputIndexes": [ 4 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1, 1, -1, -1 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "attention_mask", "outputIndexes": [ 132 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1, -1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "name": "position_ids", "outputIndexes": [ 2 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 36, 2, 1, -1, 8, 128 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "past_key_values", "outputIndexes": [ 0 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "name": "logits_index", "outputIndexes": [ 3 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 0 ] , "main_type": "Reshape", "main": { "dims": [ -1 ] , "dimType": "NCHW" } , "name": "presents", "outputIndexes": [ 1 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 3 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1, -1, 4096 ] } , "name": "/blocks.0/Constant_output_0", "outputIndexes": [ 5 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/Reshape_output_0", "outputIndexes": [ 6 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 6 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 0, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.0/input_layernorm/Mul_1_output_0", "outputIndexes": [ 7 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 7 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3856 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3856 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3857 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3857 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 32768, 8388630, 2097152, 0, 0 ] } , "name": "/layers.0/self_attn/q_proj/Linear", "outputIndexes": [ 3858 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3858 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3859 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3859 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 8 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 7 ] , "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_output_0", "outputIndexes": [ 9 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 9 ] , "main_type": "NONE", "name": "Shape52", "outputIndexes": [ 10 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 9 ] , "main_type": "NONE", "name": "Rank54", "outputIndexes": [ 11 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 11, 11 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp56", "outputIndexes": [ 12 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze57", "outputIndexes": [ 13 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1 ] } , "name": "Const9", "outputIndexes": [ 14 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp59", "outputIndexes": [ 15 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 15 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze60", "outputIndexes": [ 16 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1 ] } , "name": "Unsqueeze62", "outputIndexes": [ 17 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10, 13, 16, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice63", "outputIndexes": [ 18 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 18 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze64", "outputIndexes": [ 19 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 19, 19 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp66", "outputIndexes": [ 20 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 9, 20, 12 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_output_0", "outputIndexes": [ 21 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 0 ] } , "name": "/rotary/Constant_4_output_0", "outputIndexes": [ 22 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 21, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_output_0", "outputIndexes": [ 23 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze76", "outputIndexes": [ 24 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 15 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze79", "outputIndexes": [ 25 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10, 24, 25, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice82", "outputIndexes": [ 26 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 26 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze83", "outputIndexes": [ 27 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 27 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp84", "outputIndexes": [ 28 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 28, 27 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp85", "outputIndexes": [ 29 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 9, 29, 12 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_1_output_0", "outputIndexes": [ 30 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 30, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 31 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 32 ] } , "name": "/blocks.0/self_attn/Constant_3_output_0", "outputIndexes": [ 32 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 128 ] } , "name": "/blocks.0/self_attn/Constant_4_output_0", "outputIndexes": [ 33 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 23, 31, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.0/self_attn/Concat_output_0", "outputIndexes": [ 34 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 8, 34 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/self_attn/Reshape_output_0", "outputIndexes": [ 35 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 35 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 10518550, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.0/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 37 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2 ] , "main_type": "CastParam", "main": { "srcT": "DT_VARIANT", "dstT": "DT_FLOAT" } , "name": "/rotary/Cast_output_0", "outputIndexes": [ 38 ] , "type": "Cast", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 2 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ -1, 1 ] } , "name": "/rotary/Constant_1_output_0", "outputIndexes": [ 39 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 38, 39 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/rotary/Reshape_output_0", "outputIndexes": [ 40 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 64 ] , "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": [ 1.0, 0.805842, 0.649382, 0.523299, 0.421697, 0.339821, 0.273842, 0.220673, 0.177828, 0.143301, 0.115478, 0.093057, 0.074989, 0.06043, 0.048697, 0.039242, 0.031623, 0.025483, 0.020535, 0.016548, 0.013335, 0.010746, 0.00866, 0.006978, 0.005375, 0.004132, 0.003168, 0.002423, 0.001848, 0.001405, 0.001064, 0.000803, 0.000603, 0.00045, 0.000334, 0.000246, 0.00018, 0.00013, 0.000093, 0.000065, 0.000044, 0.000036, 0.000029, 0.000023, 0.000019, 0.000015, 0.000012, 0.00001, 0.000008, 0.000006, 0.000005, 0.000004, 0.000003, 0.000003, 0.000002, 0.000002, 0.000001, 0.000001, 0.000001, 0.000001, 0.000001, 0.0, 0.0, 0.0 ] } , "name": "/rotary/Constant_2_output_0", "outputIndexes": [ 41 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 40, 41 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/rotary/Mul_output_0", "outputIndexes": [ 42 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 42 ] , "main_type": "UnaryOp", "main": { "opType": "COS", "T": "DT_FLOAT" } , "name": "/rotary/Cos_output_0", "outputIndexes": [ 43 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 43, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_output_0", "outputIndexes": [ 44 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 42 ] , "main_type": "UnaryOp", "main": { "opType": "SIN", "T": "DT_FLOAT" } , "name": "/rotary/Sin_output_0", "outputIndexes": [ 45 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 45, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_1_output_0", "outputIndexes": [ 46 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 44, 46 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/rotary/Concat_output_0", "outputIndexes": [ 47 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 47, 47 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/rotary/Concat_1_output_0", "outputIndexes": [ 48 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 2 ] } , "name": "/rotary/Constant_7_output_0", "outputIndexes": [ 49 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 48, 49 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_2_output_0", "outputIndexes": [ 50 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 50, 17 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_3_output_0", "outputIndexes": [ 51 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": [ 1.138629 ] } , "name": "/rotary/Constant_10_output_0", "outputIndexes": [ 52 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 51, 52 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/rotary/Mul_1_output_0", "outputIndexes": [ 53 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53 ] , "main_type": "NONE", "name": "Shape118", "outputIndexes": [ 54 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 53 ] , "main_type": "NONE", "name": "Rank120", "outputIndexes": [ 55 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 55, 55 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp122", "outputIndexes": [ 56 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze123", "outputIndexes": [ 57 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp125", "outputIndexes": [ 58 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze126", "outputIndexes": [ 59 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 57, 59, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice129", "outputIndexes": [ 60 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze130", "outputIndexes": [ 61 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 61 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp132", "outputIndexes": [ 62 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 62, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_2_output_0", "outputIndexes": [ 63 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 37, 63 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_output_0", "outputIndexes": [ 64 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 37 ] , "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_2_output_0", "outputIndexes": [ 65 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 3 ] } , "name": "/blocks.0/self_attn/Constant_10_output_0", "outputIndexes": [ 66 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 65 ] , "main_type": "NONE", "name": "Shape260", "outputIndexes": [ 67 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 65 ] , "main_type": "NONE", "name": "Rank262", "outputIndexes": [ 68 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 68, 68 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp264", "outputIndexes": [ 69 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 69 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze265", "outputIndexes": [ 70 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 69, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp267", "outputIndexes": [ 71 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 71 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze268", "outputIndexes": [ 72 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 67, 70, 72, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice271", "outputIndexes": [ 73 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 73 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze272", "outputIndexes": [ 74 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 74 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp273", "outputIndexes": [ 75 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 75, 74 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp274", "outputIndexes": [ 76 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 65, 76, 69 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_4_output_0", "outputIndexes": [ 77 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 2 ] } , "name": "/rotary/Constant_6_output_0", "outputIndexes": [ 78 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 77, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Div_output_0", "outputIndexes": [ 79 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 79, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 80 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1073741824 ] } , "name": "/blocks.0/self_attn/Constant_19_output_0", "outputIndexes": [ 81 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 3 ] } , "name": "/blocks.0/self_attn/Constant_13_output_0", "outputIndexes": [ 82 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 37, 80, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_1_output_0", "outputIndexes": [ 83 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 83 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.0/self_attn/Neg_output_0", "outputIndexes": [ 84 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 79, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 85 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 37, 22, 85, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_output_0", "outputIndexes": [ 86 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 84, 86 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.0/self_attn/Concat_3_output_0", "outputIndexes": [ 87 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze169", "outputIndexes": [ 88 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze172", "outputIndexes": [ 89 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 88, 89, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice175", "outputIndexes": [ 90 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 90 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze176", "outputIndexes": [ 91 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 91 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp177", "outputIndexes": [ 92 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 92, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp178", "outputIndexes": [ 93 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 93, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_3_output_0", "outputIndexes": [ 94 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 87, 94 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_1_output_0", "outputIndexes": [ 95 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 64, 95 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Add_output_0", "outputIndexes": [ 96 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3857 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 10519574, 2097174, 524288, 0, 0 ] } , "name": "/layers.0/self_attn/k_proj/Linear", "outputIndexes": [ 3862 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3862 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3863 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3863 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 97 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 21, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 98 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 30, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 99 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 8 ] } , "name": "/blocks.0/self_attn/Constant_6_output_0", "outputIndexes": [ 100 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 98, 99, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.0/self_attn/Concat_1_output_0", "outputIndexes": [ 101 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 97, 101 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/self_attn/Reshape_1_output_0", "outputIndexes": [ 102 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 102 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 13141036, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.0/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 104 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 104, 63 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_2_output_0", "outputIndexes": [ 105 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 104 ] , "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_3_output_0", "outputIndexes": [ 106 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 106 ] , "main_type": "NONE", "name": "Shape137", "outputIndexes": [ 107 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 106 ] , "main_type": "NONE", "name": "Rank139", "outputIndexes": [ 108 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 108, 108 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp141", "outputIndexes": [ 109 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 109 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze142", "outputIndexes": [ 110 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 109, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp144", "outputIndexes": [ 111 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 111 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze145", "outputIndexes": [ 112 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 107, 110, 112, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice148", "outputIndexes": [ 113 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 113 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze149", "outputIndexes": [ 114 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 114 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp150", "outputIndexes": [ 115 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 115, 114 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp151", "outputIndexes": [ 116 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 106, 116, 109 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_5_output_0", "outputIndexes": [ 117 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 117, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Div_1_output_0", "outputIndexes": [ 118 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 118, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 119 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 104, 119, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_3_output_0", "outputIndexes": [ 120 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 120 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.0/self_attn/Neg_1_output_0", "outputIndexes": [ 121 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 118, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 122 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 104, 22, 122, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_2_output_0", "outputIndexes": [ 123 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 121, 123 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.0/self_attn/Concat_4_output_0", "outputIndexes": [ 124 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 124, 94 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_3_output_0", "outputIndexes": [ 125 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 105, 125 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Add_1_output_0", "outputIndexes": [ 126 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3857 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 13142060, 2097174, 524288, 0, 0 ] } , "name": "/layers.0/self_attn/v_proj/Linear", "outputIndexes": [ 3866 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3866 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3867 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3867 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 127 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 21, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 128 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 30, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 129 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 128, 129, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.0/self_attn/Concat_2_output_0", "outputIndexes": [ 130 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 127, 130 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/self_attn/Reshape_2_output_0", "outputIndexes": [ 131 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 96, 126, 131, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.0/self_attn/Reshape_7_output_0", "outputIndexes": [ 133 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 133 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3868 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3868 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3869 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3869 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 15763522, 8388630, 2097152, 0, 0 ] } , "name": "/layers.0/self_attn/o_proj/Linear", "outputIndexes": [ 3870 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3870 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3871 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3871 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 134 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 6, 134 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/Add_output_0", "outputIndexes": [ 135 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 135 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 26249304, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.0/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 136 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 136 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3872 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3872 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3873 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3873 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 26282072, 25165846, 6291456, 0, 0 ] } , "name": "/layers.0/mlp/gate_proj/Linear", "outputIndexes": [ 3874 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3874 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3875 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3875 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 137 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 137 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.0/mlp/act_fn/Mul_output_0", "outputIndexes": [ 138 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3873 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 57739374, 25165846, 6291456, 0, 0 ] } , "name": "/layers.0/mlp/up_proj/Linear", "outputIndexes": [ 3878 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3878 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3879 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3879 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 139 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 138, 139 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/mlp/Mul_output_0", "outputIndexes": [ 140 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 140 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3880 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3880 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3881 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3881 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 89196676, 25165846, 6291456, 0, 0 ] } , "name": "/layers.0/mlp/down_proj/Linear", "outputIndexes": [ 3882 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3882 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3883 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3883 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 141 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 135, 141 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/Add_1_output_0", "outputIndexes": [ 142 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 142, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/Reshape_output_0", "outputIndexes": [ 143 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 143 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 120653978, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.1/input_layernorm/Mul_1_output_0", "outputIndexes": [ 144 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 144 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3884 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3884 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3885 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3885 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 120686746, 8388630, 2097152, 0, 0 ] } , "name": "/layers.1/self_attn/q_proj/Linear", "outputIndexes": [ 3886 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3886 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3887 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3887 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 145 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 144 ] , "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_output_0", "outputIndexes": [ 146 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 146 ] , "main_type": "NONE", "name": "Shape505", "outputIndexes": [ 147 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 146 ] , "main_type": "NONE", "name": "Rank507", "outputIndexes": [ 148 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 148, 148 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp509", "outputIndexes": [ 149 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 149 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze510", "outputIndexes": [ 150 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 149, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp512", "outputIndexes": [ 151 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 151 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze513", "outputIndexes": [ 152 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 147, 150, 152, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice516", "outputIndexes": [ 153 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 153 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze517", "outputIndexes": [ 154 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 154, 154 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp519", "outputIndexes": [ 155 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 146, 155, 149 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_output_0", "outputIndexes": [ 156 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 156, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_output_0", "outputIndexes": [ 157 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 149 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze527", "outputIndexes": [ 158 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 151 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze530", "outputIndexes": [ 159 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 147, 158, 159, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice533", "outputIndexes": [ 160 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 160 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze534", "outputIndexes": [ 161 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 161 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp535", "outputIndexes": [ 162 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 162, 161 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp536", "outputIndexes": [ 163 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 146, 163, 149 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_1_output_0", "outputIndexes": [ 164 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 164, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 165 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 157, 165, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.1/self_attn/Concat_output_0", "outputIndexes": [ 166 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 145, 166 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/self_attn/Reshape_output_0", "outputIndexes": [ 167 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 167 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 131172528, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.1/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 169 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze554", "outputIndexes": [ 170 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze557", "outputIndexes": [ 171 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 170, 171, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice560", "outputIndexes": [ 172 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 172 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze561", "outputIndexes": [ 173 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 173, 173 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp563", "outputIndexes": [ 174 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 174, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_2_output_0", "outputIndexes": [ 175 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 169, 175 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_output_0", "outputIndexes": [ 176 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 169 ] , "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_2_output_0", "outputIndexes": [ 177 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 177 ] , "main_type": "NONE", "name": "Shape686", "outputIndexes": [ 178 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 177 ] , "main_type": "NONE", "name": "Rank688", "outputIndexes": [ 179 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 179, 179 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp690", "outputIndexes": [ 180 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 180 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze691", "outputIndexes": [ 181 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 180, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp693", "outputIndexes": [ 182 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 182 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze694", "outputIndexes": [ 183 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 178, 181, 183, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice697", "outputIndexes": [ 184 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 184 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze698", "outputIndexes": [ 185 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 185 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp699", "outputIndexes": [ 186 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 186, 185 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp700", "outputIndexes": [ 187 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 177, 187, 180 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_4_output_0", "outputIndexes": [ 188 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 188, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Div_output_0", "outputIndexes": [ 189 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 189, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 190 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 169, 190, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_1_output_0", "outputIndexes": [ 191 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 191 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.1/self_attn/Neg_output_0", "outputIndexes": [ 192 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 189, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 193 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 169, 22, 193, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_output_0", "outputIndexes": [ 194 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 192, 194 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.1/self_attn/Concat_3_output_0", "outputIndexes": [ 195 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze596", "outputIndexes": [ 196 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze599", "outputIndexes": [ 197 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 196, 197, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice602", "outputIndexes": [ 198 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 198 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze603", "outputIndexes": [ 199 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 199 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp604", "outputIndexes": [ 200 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 200, 199 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp605", "outputIndexes": [ 201 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 201, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_3_output_0", "outputIndexes": [ 202 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 195, 202 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_1_output_0", "outputIndexes": [ 203 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 176, 203 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Add_output_0", "outputIndexes": [ 204 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3885 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 131173552, 2097174, 524288, 0, 0 ] } , "name": "/layers.1/self_attn/k_proj/Linear", "outputIndexes": [ 3890 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3890 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3891 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3891 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 205 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 156, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 206 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 164, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 207 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 206, 207, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.1/self_attn/Concat_1_output_0", "outputIndexes": [ 208 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 205, 208 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/self_attn/Reshape_1_output_0", "outputIndexes": [ 209 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 209 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 133795014, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.1/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 211 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 211, 175 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_2_output_0", "outputIndexes": [ 212 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 211 ] , "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_3_output_0", "outputIndexes": [ 213 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 213 ] , "main_type": "NONE", "name": "Shape567", "outputIndexes": [ 214 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 213 ] , "main_type": "NONE", "name": "Rank569", "outputIndexes": [ 215 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 215, 215 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp571", "outputIndexes": [ 216 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 216 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze572", "outputIndexes": [ 217 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 216, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp574", "outputIndexes": [ 218 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 218 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze575", "outputIndexes": [ 219 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 214, 217, 219, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice578", "outputIndexes": [ 220 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 220 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze579", "outputIndexes": [ 221 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 221 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp580", "outputIndexes": [ 222 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 222, 221 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp581", "outputIndexes": [ 223 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 213, 223, 216 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_5_output_0", "outputIndexes": [ 224 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 224, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Div_1_output_0", "outputIndexes": [ 225 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 225, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 226 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 211, 226, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_3_output_0", "outputIndexes": [ 227 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 227 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.1/self_attn/Neg_1_output_0", "outputIndexes": [ 228 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 225, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 229 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 211, 22, 229, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_2_output_0", "outputIndexes": [ 230 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 228, 230 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.1/self_attn/Concat_4_output_0", "outputIndexes": [ 231 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 231, 202 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_3_output_0", "outputIndexes": [ 232 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 212, 232 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Add_1_output_0", "outputIndexes": [ 233 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3885 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 133796038, 2097174, 524288, 0, 0 ] } , "name": "/layers.1/self_attn/v_proj/Linear", "outputIndexes": [ 3894 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3894 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3895 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3895 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 234 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 156, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 235 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 164, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 236 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 235, 236, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.1/self_attn/Concat_2_output_0", "outputIndexes": [ 237 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 234, 237 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/self_attn/Reshape_2_output_0", "outputIndexes": [ 238 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 204, 233, 238, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.1/self_attn/Reshape_7_output_0", "outputIndexes": [ 239 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 239 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3896 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3896 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3897 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3897 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 136417500, 8388630, 2097152, 0, 0 ] } , "name": "/layers.1/self_attn/o_proj/Linear", "outputIndexes": [ 3898 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3898 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3899 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3899 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 240 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 143, 240 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/Add_output_0", "outputIndexes": [ 241 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 241 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 146903282, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.1/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 242 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 242 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3900 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3900 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3901 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3901 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 146936050, 25165846, 6291456, 0, 0 ] } , "name": "/layers.1/mlp/gate_proj/Linear", "outputIndexes": [ 3902 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3902 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3903 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3903 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 243 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 243 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.1/mlp/act_fn/Mul_output_0", "outputIndexes": [ 244 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3901 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 178393352, 25165846, 6291456, 0, 0 ] } , "name": "/layers.1/mlp/up_proj/Linear", "outputIndexes": [ 3906 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3906 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3907 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3907 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 245 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 244, 245 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/mlp/Mul_output_0", "outputIndexes": [ 246 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 246 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3908 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3908 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3909 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3909 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 209850654, 25165846, 6291456, 0, 0 ] } , "name": "/layers.1/mlp/down_proj/Linear", "outputIndexes": [ 3910 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3910 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3911 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3911 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 247 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 241, 247 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/Add_1_output_0", "outputIndexes": [ 248 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 248, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/Reshape_output_0", "outputIndexes": [ 249 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 249 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 241307956, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.2/input_layernorm/Mul_1_output_0", "outputIndexes": [ 250 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 250 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3912 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3912 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3913 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3913 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 241340724, 8388630, 2097152, 0, 0 ] } , "name": "/layers.2/self_attn/q_proj/Linear", "outputIndexes": [ 3914 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3914 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3915 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3915 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 251 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 250 ] , "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_output_0", "outputIndexes": [ 252 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 252 ] , "main_type": "NONE", "name": "Shape925", "outputIndexes": [ 253 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 252 ] , "main_type": "NONE", "name": "Rank927", "outputIndexes": [ 254 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 254, 254 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp929", "outputIndexes": [ 255 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 255 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze930", "outputIndexes": [ 256 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 255, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp932", "outputIndexes": [ 257 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 257 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze933", "outputIndexes": [ 258 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 253, 256, 258, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice936", "outputIndexes": [ 259 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 259 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze937", "outputIndexes": [ 260 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 260, 260 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp939", "outputIndexes": [ 261 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 252, 261, 255 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_output_0", "outputIndexes": [ 262 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 262, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_output_0", "outputIndexes": [ 263 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 255 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze947", "outputIndexes": [ 264 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 257 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze950", "outputIndexes": [ 265 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 253, 264, 265, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice953", "outputIndexes": [ 266 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 266 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze954", "outputIndexes": [ 267 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 267 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp955", "outputIndexes": [ 268 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 268, 267 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp956", "outputIndexes": [ 269 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 252, 269, 255 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_1_output_0", "outputIndexes": [ 270 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 270, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 271 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 263, 271, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.2/self_attn/Concat_output_0", "outputIndexes": [ 272 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 251, 272 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/self_attn/Reshape_output_0", "outputIndexes": [ 273 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 273 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 251826506, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.2/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 275 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze974", "outputIndexes": [ 276 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze977", "outputIndexes": [ 277 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 276, 277, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice980", "outputIndexes": [ 278 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 278 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze981", "outputIndexes": [ 279 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 279, 279 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp983", "outputIndexes": [ 280 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 280, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_2_output_0", "outputIndexes": [ 281 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 275, 281 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_output_0", "outputIndexes": [ 282 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 275 ] , "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_2_output_0", "outputIndexes": [ 283 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 283 ] , "main_type": "NONE", "name": "Shape1106", "outputIndexes": [ 284 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 283 ] , "main_type": "NONE", "name": "Rank1108", "outputIndexes": [ 285 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 285, 285 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1110", "outputIndexes": [ 286 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 286 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1111", "outputIndexes": [ 287 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 286, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1113", "outputIndexes": [ 288 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 288 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1114", "outputIndexes": [ 289 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 284, 287, 289, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1117", "outputIndexes": [ 290 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 290 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1118", "outputIndexes": [ 291 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 291 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1119", "outputIndexes": [ 292 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 292, 291 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1120", "outputIndexes": [ 293 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 283, 293, 286 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_4_output_0", "outputIndexes": [ 294 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 294, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Div_output_0", "outputIndexes": [ 295 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 295, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 296 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 275, 296, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_1_output_0", "outputIndexes": [ 297 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 297 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.2/self_attn/Neg_output_0", "outputIndexes": [ 298 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 295, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 299 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 275, 22, 299, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_output_0", "outputIndexes": [ 300 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 298, 300 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.2/self_attn/Concat_3_output_0", "outputIndexes": [ 301 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1016", "outputIndexes": [ 302 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1019", "outputIndexes": [ 303 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 302, 303, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1022", "outputIndexes": [ 304 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 304 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1023", "outputIndexes": [ 305 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 305 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1024", "outputIndexes": [ 306 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 306, 305 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1025", "outputIndexes": [ 307 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 307, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_3_output_0", "outputIndexes": [ 308 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 301, 308 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_1_output_0", "outputIndexes": [ 309 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 282, 309 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Add_output_0", "outputIndexes": [ 310 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3913 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 251827530, 2097174, 524288, 0, 0 ] } , "name": "/layers.2/self_attn/k_proj/Linear", "outputIndexes": [ 3918 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3918 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3919 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3919 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 311 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 262, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 312 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 270, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 313 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 312, 313, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.2/self_attn/Concat_1_output_0", "outputIndexes": [ 314 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 311, 314 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/self_attn/Reshape_1_output_0", "outputIndexes": [ 315 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 315 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 254448992, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.2/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 317 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 317, 281 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_2_output_0", "outputIndexes": [ 318 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 317 ] , "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_3_output_0", "outputIndexes": [ 319 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 319 ] , "main_type": "NONE", "name": "Shape987", "outputIndexes": [ 320 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 319 ] , "main_type": "NONE", "name": "Rank989", "outputIndexes": [ 321 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 321, 321 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp991", "outputIndexes": [ 322 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 322 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze992", "outputIndexes": [ 323 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 322, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp994", "outputIndexes": [ 324 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 324 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze995", "outputIndexes": [ 325 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 320, 323, 325, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice998", "outputIndexes": [ 326 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 326 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze999", "outputIndexes": [ 327 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 327 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1000", "outputIndexes": [ 328 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 328, 327 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1001", "outputIndexes": [ 329 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 319, 329, 322 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_5_output_0", "outputIndexes": [ 330 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 330, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Div_1_output_0", "outputIndexes": [ 331 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 331, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 332 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 317, 332, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_3_output_0", "outputIndexes": [ 333 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 333 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.2/self_attn/Neg_1_output_0", "outputIndexes": [ 334 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 331, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 335 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 317, 22, 335, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_2_output_0", "outputIndexes": [ 336 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 334, 336 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.2/self_attn/Concat_4_output_0", "outputIndexes": [ 337 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 337, 308 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_3_output_0", "outputIndexes": [ 338 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 318, 338 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Add_1_output_0", "outputIndexes": [ 339 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3913 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 254450016, 2097174, 524288, 0, 0 ] } , "name": "/layers.2/self_attn/v_proj/Linear", "outputIndexes": [ 3922 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3922 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3923 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3923 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 340 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 262, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 341 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 270, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 342 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 341, 342, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.2/self_attn/Concat_2_output_0", "outputIndexes": [ 343 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 340, 343 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/self_attn/Reshape_2_output_0", "outputIndexes": [ 344 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 310, 339, 344, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.2/self_attn/Reshape_7_output_0", "outputIndexes": [ 345 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 345 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3924 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3924 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3925 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3925 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 257071478, 8388630, 2097152, 0, 0 ] } , "name": "/layers.2/self_attn/o_proj/Linear", "outputIndexes": [ 3926 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3926 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3927 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3927 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 346 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 249, 346 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/Add_output_0", "outputIndexes": [ 347 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 347 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 267557260, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.2/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 348 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 348 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3928 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3928 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3929 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3929 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 267590028, 25165846, 6291456, 0, 0 ] } , "name": "/layers.2/mlp/gate_proj/Linear", "outputIndexes": [ 3930 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3930 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3931 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3931 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 349 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 349 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.2/mlp/act_fn/Mul_output_0", "outputIndexes": [ 350 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3929 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 299047330, 25165846, 6291456, 0, 0 ] } , "name": "/layers.2/mlp/up_proj/Linear", "outputIndexes": [ 3934 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3934 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3935 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3935 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 351 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 350, 351 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/mlp/Mul_output_0", "outputIndexes": [ 352 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 352 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3936 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3936 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3937 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3937 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 330504632, 25165846, 6291456, 0, 0 ] } , "name": "/layers.2/mlp/down_proj/Linear", "outputIndexes": [ 3938 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3938 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3939 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3939 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 353 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 347, 353 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/Add_1_output_0", "outputIndexes": [ 354 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 354, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/Reshape_output_0", "outputIndexes": [ 355 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 355 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 361961934, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.3/input_layernorm/Mul_1_output_0", "outputIndexes": [ 356 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 356 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3940 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3940 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3941 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3941 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 361994702, 8388630, 2097152, 0, 0 ] } , "name": "/layers.3/self_attn/q_proj/Linear", "outputIndexes": [ 3942 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3942 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3943 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3943 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 357 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 356 ] , "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_output_0", "outputIndexes": [ 358 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 358 ] , "main_type": "NONE", "name": "Shape1345", "outputIndexes": [ 359 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 358 ] , "main_type": "NONE", "name": "Rank1347", "outputIndexes": [ 360 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 360, 360 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1349", "outputIndexes": [ 361 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 361 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1350", "outputIndexes": [ 362 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 361, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1352", "outputIndexes": [ 363 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 363 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1353", "outputIndexes": [ 364 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 359, 362, 364, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1356", "outputIndexes": [ 365 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 365 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1357", "outputIndexes": [ 366 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 366, 366 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1359", "outputIndexes": [ 367 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 358, 367, 361 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_output_0", "outputIndexes": [ 368 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 368, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_output_0", "outputIndexes": [ 369 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 361 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1367", "outputIndexes": [ 370 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 363 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1370", "outputIndexes": [ 371 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 359, 370, 371, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1373", "outputIndexes": [ 372 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 372 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1374", "outputIndexes": [ 373 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 373 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1375", "outputIndexes": [ 374 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 374, 373 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1376", "outputIndexes": [ 375 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 358, 375, 361 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_1_output_0", "outputIndexes": [ 376 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 376, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 377 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 369, 377, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.3/self_attn/Concat_output_0", "outputIndexes": [ 378 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 357, 378 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/self_attn/Reshape_output_0", "outputIndexes": [ 379 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 379 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 372480484, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.3/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 381 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1394", "outputIndexes": [ 382 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1397", "outputIndexes": [ 383 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 382, 383, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1400", "outputIndexes": [ 384 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 384 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1401", "outputIndexes": [ 385 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 385, 385 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1403", "outputIndexes": [ 386 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 386, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_2_output_0", "outputIndexes": [ 387 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 381, 387 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_output_0", "outputIndexes": [ 388 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 381 ] , "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_2_output_0", "outputIndexes": [ 389 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 389 ] , "main_type": "NONE", "name": "Shape1526", "outputIndexes": [ 390 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 389 ] , "main_type": "NONE", "name": "Rank1528", "outputIndexes": [ 391 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 391, 391 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1530", "outputIndexes": [ 392 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 392 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1531", "outputIndexes": [ 393 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 392, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1533", "outputIndexes": [ 394 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 394 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1534", "outputIndexes": [ 395 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 390, 393, 395, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1537", "outputIndexes": [ 396 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 396 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1538", "outputIndexes": [ 397 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 397 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1539", "outputIndexes": [ 398 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 398, 397 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1540", "outputIndexes": [ 399 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 389, 399, 392 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_4_output_0", "outputIndexes": [ 400 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 400, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Div_output_0", "outputIndexes": [ 401 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 401, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 402 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 381, 402, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_1_output_0", "outputIndexes": [ 403 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 403 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.3/self_attn/Neg_output_0", "outputIndexes": [ 404 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 401, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 405 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 381, 22, 405, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_output_0", "outputIndexes": [ 406 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 404, 406 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.3/self_attn/Concat_3_output_0", "outputIndexes": [ 407 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1436", "outputIndexes": [ 408 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1439", "outputIndexes": [ 409 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 408, 409, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1442", "outputIndexes": [ 410 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1443", "outputIndexes": [ 411 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 411 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1444", "outputIndexes": [ 412 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 412, 411 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1445", "outputIndexes": [ 413 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 413, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_3_output_0", "outputIndexes": [ 414 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 407, 414 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_1_output_0", "outputIndexes": [ 415 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 388, 415 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Add_output_0", "outputIndexes": [ 416 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3941 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 372481508, 2097174, 524288, 0, 0 ] } , "name": "/layers.3/self_attn/k_proj/Linear", "outputIndexes": [ 3946 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3946 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3947 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3947 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 417 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 368, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 418 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 376, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 419 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 418, 419, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.3/self_attn/Concat_1_output_0", "outputIndexes": [ 420 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 417, 420 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/self_attn/Reshape_1_output_0", "outputIndexes": [ 421 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 421 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 375102970, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.3/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 423 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 423, 387 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_2_output_0", "outputIndexes": [ 424 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 423 ] , "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_3_output_0", "outputIndexes": [ 425 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 425 ] , "main_type": "NONE", "name": "Shape1407", "outputIndexes": [ 426 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 425 ] , "main_type": "NONE", "name": "Rank1409", "outputIndexes": [ 427 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 427, 427 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1411", "outputIndexes": [ 428 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 428 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1412", "outputIndexes": [ 429 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 428, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1414", "outputIndexes": [ 430 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 430 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1415", "outputIndexes": [ 431 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 426, 429, 431, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1418", "outputIndexes": [ 432 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 432 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1419", "outputIndexes": [ 433 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 433 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1420", "outputIndexes": [ 434 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 434, 433 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1421", "outputIndexes": [ 435 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 425, 435, 428 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_5_output_0", "outputIndexes": [ 436 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 436, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Div_1_output_0", "outputIndexes": [ 437 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 437, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 438 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 423, 438, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_3_output_0", "outputIndexes": [ 439 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 439 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.3/self_attn/Neg_1_output_0", "outputIndexes": [ 440 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 437, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 441 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 423, 22, 441, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_2_output_0", "outputIndexes": [ 442 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 440, 442 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.3/self_attn/Concat_4_output_0", "outputIndexes": [ 443 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 443, 414 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_3_output_0", "outputIndexes": [ 444 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 424, 444 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Add_1_output_0", "outputIndexes": [ 445 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3941 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 375103994, 2097174, 524288, 0, 0 ] } , "name": "/layers.3/self_attn/v_proj/Linear", "outputIndexes": [ 3950 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3950 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3951 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3951 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 446 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 368, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 447 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 376, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 448 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 447, 448, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.3/self_attn/Concat_2_output_0", "outputIndexes": [ 449 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 446, 449 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/self_attn/Reshape_2_output_0", "outputIndexes": [ 450 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 416, 445, 450, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.3/self_attn/Reshape_7_output_0", "outputIndexes": [ 451 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 451 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3952 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3952 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3953 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3953 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 377725456, 8388630, 2097152, 0, 0 ] } , "name": "/layers.3/self_attn/o_proj/Linear", "outputIndexes": [ 3954 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3954 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3955 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3955 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 452 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 355, 452 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/Add_output_0", "outputIndexes": [ 453 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 453 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 388211238, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.3/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 454 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 454 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3956 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3956 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3957 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3957 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 388244006, 25165846, 6291456, 0, 0 ] } , "name": "/layers.3/mlp/gate_proj/Linear", "outputIndexes": [ 3958 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3958 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3959 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3959 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 455 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 455 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.3/mlp/act_fn/Mul_output_0", "outputIndexes": [ 456 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3957 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 419701308, 25165846, 6291456, 0, 0 ] } , "name": "/layers.3/mlp/up_proj/Linear", "outputIndexes": [ 3962 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3962 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3963 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3963 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 457 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 456, 457 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/mlp/Mul_output_0", "outputIndexes": [ 458 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 458 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3964 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3964 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3965 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3965 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 451158610, 25165846, 6291456, 0, 0 ] } , "name": "/layers.3/mlp/down_proj/Linear", "outputIndexes": [ 3966 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3966 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3967 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3967 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 459 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 453, 459 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/Add_1_output_0", "outputIndexes": [ 460 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 460, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/Reshape_output_0", "outputIndexes": [ 461 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 461 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 482615912, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.4/input_layernorm/Mul_1_output_0", "outputIndexes": [ 462 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 462 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3968 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3968 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3969 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3969 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 482648680, 8388630, 2097152, 0, 0 ] } , "name": "/layers.4/self_attn/q_proj/Linear", "outputIndexes": [ 3970 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3970 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3971 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3971 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 463 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 462 ] , "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_output_0", "outputIndexes": [ 464 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 464 ] , "main_type": "NONE", "name": "Shape1765", "outputIndexes": [ 465 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 464 ] , "main_type": "NONE", "name": "Rank1767", "outputIndexes": [ 466 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 466, 466 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1769", "outputIndexes": [ 467 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 467 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1770", "outputIndexes": [ 468 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 467, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1772", "outputIndexes": [ 469 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 469 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1773", "outputIndexes": [ 470 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 465, 468, 470, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1776", "outputIndexes": [ 471 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 471 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1777", "outputIndexes": [ 472 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 472, 472 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1779", "outputIndexes": [ 473 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 464, 473, 467 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_output_0", "outputIndexes": [ 474 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 474, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_output_0", "outputIndexes": [ 475 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 467 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1787", "outputIndexes": [ 476 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 469 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1790", "outputIndexes": [ 477 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 465, 476, 477, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1793", "outputIndexes": [ 478 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 478 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1794", "outputIndexes": [ 479 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 479 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1795", "outputIndexes": [ 480 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 480, 479 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1796", "outputIndexes": [ 481 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 464, 481, 467 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_1_output_0", "outputIndexes": [ 482 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 482, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 483 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 475, 483, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.4/self_attn/Concat_output_0", "outputIndexes": [ 484 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 463, 484 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/self_attn/Reshape_output_0", "outputIndexes": [ 485 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 485 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 493134462, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.4/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 487 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1814", "outputIndexes": [ 488 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1817", "outputIndexes": [ 489 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 488, 489, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1820", "outputIndexes": [ 490 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 490 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1821", "outputIndexes": [ 491 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 491, 491 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1823", "outputIndexes": [ 492 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 492, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_2_output_0", "outputIndexes": [ 493 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 487, 493 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_output_0", "outputIndexes": [ 494 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 487 ] , "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_2_output_0", "outputIndexes": [ 495 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 495 ] , "main_type": "NONE", "name": "Shape1947", "outputIndexes": [ 496 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 495 ] , "main_type": "NONE", "name": "Rank1949", "outputIndexes": [ 497 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 497, 497 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1951", "outputIndexes": [ 498 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 498 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1952", "outputIndexes": [ 499 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 498, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1954", "outputIndexes": [ 500 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 500 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1955", "outputIndexes": [ 501 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 496, 499, 501, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1958", "outputIndexes": [ 502 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 502 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1959", "outputIndexes": [ 503 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 503 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1960", "outputIndexes": [ 504 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 504, 503 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1961", "outputIndexes": [ 505 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 495, 505, 498 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_4_output_0", "outputIndexes": [ 506 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 506, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Div_output_0", "outputIndexes": [ 507 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 507, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 508 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 487, 508, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_1_output_0", "outputIndexes": [ 509 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 509 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.4/self_attn/Neg_output_0", "outputIndexes": [ 510 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 507, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 511 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 487, 22, 511, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_output_0", "outputIndexes": [ 512 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 510, 512 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.4/self_attn/Concat_3_output_0", "outputIndexes": [ 513 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1856", "outputIndexes": [ 514 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1859", "outputIndexes": [ 515 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 514, 515, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1862", "outputIndexes": [ 516 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 516 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1863", "outputIndexes": [ 517 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 517 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1864", "outputIndexes": [ 518 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 518, 517 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1865", "outputIndexes": [ 519 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 519, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_3_output_0", "outputIndexes": [ 520 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 513, 520 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_1_output_0", "outputIndexes": [ 521 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 494, 521 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Add_output_0", "outputIndexes": [ 522 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3969 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 493135486, 2097174, 524288, 0, 0 ] } , "name": "/layers.4/self_attn/k_proj/Linear", "outputIndexes": [ 3974 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3974 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3975 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3975 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 523 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 474, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 524 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 482, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 525 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 524, 525, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.4/self_attn/Concat_1_output_0", "outputIndexes": [ 526 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 523, 526 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/self_attn/Reshape_1_output_0", "outputIndexes": [ 527 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 527 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 495756948, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.4/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 529 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 529, 493 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_2_output_0", "outputIndexes": [ 530 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 529 ] , "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_3_output_0", "outputIndexes": [ 531 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 531 ] , "main_type": "NONE", "name": "Shape1827", "outputIndexes": [ 532 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 531 ] , "main_type": "NONE", "name": "Rank1829", "outputIndexes": [ 533 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 533, 533 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1831", "outputIndexes": [ 534 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 534 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1832", "outputIndexes": [ 535 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 534, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1834", "outputIndexes": [ 536 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 536 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1835", "outputIndexes": [ 537 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 532, 535, 537, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1838", "outputIndexes": [ 538 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 538 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1839", "outputIndexes": [ 539 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 539 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1840", "outputIndexes": [ 540 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 540, 539 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1841", "outputIndexes": [ 541 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 531, 541, 534 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_5_output_0", "outputIndexes": [ 542 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 542, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Div_1_output_0", "outputIndexes": [ 543 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 543, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 544 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 529, 544, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_3_output_0", "outputIndexes": [ 545 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 545 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.4/self_attn/Neg_1_output_0", "outputIndexes": [ 546 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 543, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 547 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 529, 22, 547, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_2_output_0", "outputIndexes": [ 548 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 546, 548 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.4/self_attn/Concat_4_output_0", "outputIndexes": [ 549 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 549, 520 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_3_output_0", "outputIndexes": [ 550 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 530, 550 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Add_1_output_0", "outputIndexes": [ 551 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3969 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 495757972, 2097174, 524288, 0, 0 ] } , "name": "/layers.4/self_attn/v_proj/Linear", "outputIndexes": [ 3978 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3978 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3979 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3979 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 552 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 474, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 553 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 482, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 554 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 553, 554, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.4/self_attn/Concat_2_output_0", "outputIndexes": [ 555 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 552, 555 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/self_attn/Reshape_2_output_0", "outputIndexes": [ 556 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 522, 551, 556, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.4/self_attn/Reshape_7_output_0", "outputIndexes": [ 557 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 557 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3980 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3980 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3981 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3981 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 498379434, 8388630, 2097152, 0, 0 ] } , "name": "/layers.4/self_attn/o_proj/Linear", "outputIndexes": [ 3982 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3982 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3983 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3983 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 558 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 461, 558 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/Add_output_0", "outputIndexes": [ 559 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 559 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 508865216, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.4/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 560 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 560 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3984 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3984 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3985 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3985 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 508897984, 25165846, 6291456, 0, 0 ] } , "name": "/layers.4/mlp/gate_proj/Linear", "outputIndexes": [ 3986 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3986 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3987 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3987 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 561 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 561 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.4/mlp/act_fn/Mul_output_0", "outputIndexes": [ 562 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3985 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 540355286, 25165846, 6291456, 0, 0 ] } , "name": "/layers.4/mlp/up_proj/Linear", "outputIndexes": [ 3990 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3990 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3991 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3991 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 563 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 562, 563 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/mlp/Mul_output_0", "outputIndexes": [ 564 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 564 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3992 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3992 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3993 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3993 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 571812588, 25165846, 6291456, 0, 0 ] } , "name": "/layers.4/mlp/down_proj/Linear", "outputIndexes": [ 3994 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3994 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3995 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3995 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 565 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 559, 565 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/Add_1_output_0", "outputIndexes": [ 566 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 566, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/Reshape_output_0", "outputIndexes": [ 567 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 567 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 603269890, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.5/input_layernorm/Mul_1_output_0", "outputIndexes": [ 568 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 568 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3996 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3996 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3997 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3997 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 603302658, 8388630, 2097152, 0, 0 ] } , "name": "/layers.5/self_attn/q_proj/Linear", "outputIndexes": [ 3998 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3998 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3999 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3999 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 569 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 568 ] , "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_output_0", "outputIndexes": [ 570 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 570 ] , "main_type": "NONE", "name": "Shape2186", "outputIndexes": [ 571 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 570 ] , "main_type": "NONE", "name": "Rank2188", "outputIndexes": [ 572 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 572, 572 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2190", "outputIndexes": [ 573 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 573 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2191", "outputIndexes": [ 574 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 573, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2193", "outputIndexes": [ 575 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 575 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2194", "outputIndexes": [ 576 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 571, 574, 576, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2197", "outputIndexes": [ 577 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 577 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2198", "outputIndexes": [ 578 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 578, 578 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2200", "outputIndexes": [ 579 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 570, 579, 573 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_output_0", "outputIndexes": [ 580 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 580, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_output_0", "outputIndexes": [ 581 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 573 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2208", "outputIndexes": [ 582 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 575 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2211", "outputIndexes": [ 583 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 571, 582, 583, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2214", "outputIndexes": [ 584 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 584 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2215", "outputIndexes": [ 585 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 585 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2216", "outputIndexes": [ 586 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 586, 585 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2217", "outputIndexes": [ 587 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 570, 587, 573 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_1_output_0", "outputIndexes": [ 588 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 588, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 589 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 581, 589, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.5/self_attn/Concat_output_0", "outputIndexes": [ 590 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 569, 590 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/self_attn/Reshape_output_0", "outputIndexes": [ 591 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 591 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 613788440, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.5/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 593 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2235", "outputIndexes": [ 594 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2238", "outputIndexes": [ 595 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 594, 595, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2241", "outputIndexes": [ 596 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 596 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2242", "outputIndexes": [ 597 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 597, 597 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2244", "outputIndexes": [ 598 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 598, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_2_output_0", "outputIndexes": [ 599 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 593, 599 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_output_0", "outputIndexes": [ 600 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 593 ] , "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_2_output_0", "outputIndexes": [ 601 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 601 ] , "main_type": "NONE", "name": "Shape2368", "outputIndexes": [ 602 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 601 ] , "main_type": "NONE", "name": "Rank2370", "outputIndexes": [ 603 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 603, 603 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2372", "outputIndexes": [ 604 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 604 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2373", "outputIndexes": [ 605 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 604, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2375", "outputIndexes": [ 606 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 606 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2376", "outputIndexes": [ 607 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 602, 605, 607, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2379", "outputIndexes": [ 608 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 608 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2380", "outputIndexes": [ 609 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 609 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2381", "outputIndexes": [ 610 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 610, 609 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2382", "outputIndexes": [ 611 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 601, 611, 604 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_4_output_0", "outputIndexes": [ 612 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 612, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Div_output_0", "outputIndexes": [ 613 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 613, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 614 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 593, 614, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_1_output_0", "outputIndexes": [ 615 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 615 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.5/self_attn/Neg_output_0", "outputIndexes": [ 616 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 613, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 617 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 593, 22, 617, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_output_0", "outputIndexes": [ 618 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 616, 618 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.5/self_attn/Concat_3_output_0", "outputIndexes": [ 619 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2277", "outputIndexes": [ 620 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2280", "outputIndexes": [ 621 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 620, 621, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2283", "outputIndexes": [ 622 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 622 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2284", "outputIndexes": [ 623 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 623 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2285", "outputIndexes": [ 624 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 624, 623 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2286", "outputIndexes": [ 625 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 625, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_3_output_0", "outputIndexes": [ 626 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 619, 626 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_1_output_0", "outputIndexes": [ 627 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 600, 627 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Add_output_0", "outputIndexes": [ 628 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3997 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 613789464, 2097174, 524288, 0, 0 ] } , "name": "/layers.5/self_attn/k_proj/Linear", "outputIndexes": [ 4002 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4002 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4003 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4003 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 629 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 580, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 630 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 588, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 631 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 630, 631, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.5/self_attn/Concat_1_output_0", "outputIndexes": [ 632 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 629, 632 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/self_attn/Reshape_1_output_0", "outputIndexes": [ 633 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 633 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 616410926, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.5/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 635 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 635, 599 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_2_output_0", "outputIndexes": [ 636 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 635 ] , "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_3_output_0", "outputIndexes": [ 637 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 637 ] , "main_type": "NONE", "name": "Shape2248", "outputIndexes": [ 638 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 637 ] , "main_type": "NONE", "name": "Rank2250", "outputIndexes": [ 639 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 639, 639 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2252", "outputIndexes": [ 640 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 640 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2253", "outputIndexes": [ 641 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 640, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2255", "outputIndexes": [ 642 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 642 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2256", "outputIndexes": [ 643 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 638, 641, 643, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2259", "outputIndexes": [ 644 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 644 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2260", "outputIndexes": [ 645 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 645 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2261", "outputIndexes": [ 646 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 646, 645 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2262", "outputIndexes": [ 647 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 637, 647, 640 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_5_output_0", "outputIndexes": [ 648 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 648, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Div_1_output_0", "outputIndexes": [ 649 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 649, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 650 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 635, 650, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_3_output_0", "outputIndexes": [ 651 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 651 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.5/self_attn/Neg_1_output_0", "outputIndexes": [ 652 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 649, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 653 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 635, 22, 653, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_2_output_0", "outputIndexes": [ 654 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 652, 654 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.5/self_attn/Concat_4_output_0", "outputIndexes": [ 655 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 655, 626 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_3_output_0", "outputIndexes": [ 656 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 636, 656 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Add_1_output_0", "outputIndexes": [ 657 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3997 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 616411950, 2097174, 524288, 0, 0 ] } , "name": "/layers.5/self_attn/v_proj/Linear", "outputIndexes": [ 4006 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4006 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4007 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4007 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 658 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 580, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 659 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 588, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 660 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 659, 660, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.5/self_attn/Concat_2_output_0", "outputIndexes": [ 661 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 658, 661 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/self_attn/Reshape_2_output_0", "outputIndexes": [ 662 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 628, 657, 662, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.5/self_attn/Reshape_7_output_0", "outputIndexes": [ 663 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 663 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4008 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4008 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4009 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4009 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 619033412, 8388630, 2097152, 0, 0 ] } , "name": "/layers.5/self_attn/o_proj/Linear", "outputIndexes": [ 4010 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4010 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4011 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4011 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 664 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 567, 664 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/Add_output_0", "outputIndexes": [ 665 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 665 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 629519194, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.5/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 666 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 666 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4012 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4012 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4013 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4013 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 629551962, 25165846, 6291456, 0, 0 ] } , "name": "/layers.5/mlp/gate_proj/Linear", "outputIndexes": [ 4014 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4014 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4015 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4015 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 667 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 667 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.5/mlp/act_fn/Mul_output_0", "outputIndexes": [ 668 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4013 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 661009264, 25165846, 6291456, 0, 0 ] } , "name": "/layers.5/mlp/up_proj/Linear", "outputIndexes": [ 4018 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4018 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4019 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4019 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 669 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 668, 669 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/mlp/Mul_output_0", "outputIndexes": [ 670 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 670 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4020 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4020 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4021 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4021 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 692466566, 25165846, 6291456, 0, 0 ] } , "name": "/layers.5/mlp/down_proj/Linear", "outputIndexes": [ 4022 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4022 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4023 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4023 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 671 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 665, 671 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/Add_1_output_0", "outputIndexes": [ 672 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 672, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/Reshape_output_0", "outputIndexes": [ 673 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 673 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 723923868, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.6/input_layernorm/Mul_1_output_0", "outputIndexes": [ 674 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 674 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4024 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4024 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4025 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4025 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 723956636, 8388630, 2097152, 0, 0 ] } , "name": "/layers.6/self_attn/q_proj/Linear", "outputIndexes": [ 4026 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4026 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4027 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4027 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 675 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 674 ] , "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_output_0", "outputIndexes": [ 676 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 676 ] , "main_type": "NONE", "name": "Shape2607", "outputIndexes": [ 677 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 676 ] , "main_type": "NONE", "name": "Rank2609", "outputIndexes": [ 678 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 678, 678 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2611", "outputIndexes": [ 679 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 679 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2612", "outputIndexes": [ 680 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 679, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2614", "outputIndexes": [ 681 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 681 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2615", "outputIndexes": [ 682 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 677, 680, 682, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2618", "outputIndexes": [ 683 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 683 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2619", "outputIndexes": [ 684 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 684, 684 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2621", "outputIndexes": [ 685 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 676, 685, 679 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_output_0", "outputIndexes": [ 686 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 686, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_output_0", "outputIndexes": [ 687 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 679 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2629", "outputIndexes": [ 688 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 681 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2632", "outputIndexes": [ 689 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 677, 688, 689, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2635", "outputIndexes": [ 690 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 690 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2636", "outputIndexes": [ 691 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 691 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2637", "outputIndexes": [ 692 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 692, 691 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2638", "outputIndexes": [ 693 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 676, 693, 679 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_1_output_0", "outputIndexes": [ 694 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 694, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 695 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 687, 695, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.6/self_attn/Concat_output_0", "outputIndexes": [ 696 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 675, 696 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/self_attn/Reshape_output_0", "outputIndexes": [ 697 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 697 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 734442418, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.6/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 699 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2656", "outputIndexes": [ 700 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2659", "outputIndexes": [ 701 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 700, 701, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2662", "outputIndexes": [ 702 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 702 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2663", "outputIndexes": [ 703 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 703, 703 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2665", "outputIndexes": [ 704 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 704, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_2_output_0", "outputIndexes": [ 705 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 699, 705 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_output_0", "outputIndexes": [ 706 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 699 ] , "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_2_output_0", "outputIndexes": [ 707 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 707 ] , "main_type": "NONE", "name": "Shape2789", "outputIndexes": [ 708 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 707 ] , "main_type": "NONE", "name": "Rank2791", "outputIndexes": [ 709 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 709, 709 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2793", "outputIndexes": [ 710 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 710 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2794", "outputIndexes": [ 711 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 710, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2796", "outputIndexes": [ 712 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 712 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2797", "outputIndexes": [ 713 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 708, 711, 713, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2800", "outputIndexes": [ 714 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 714 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2801", "outputIndexes": [ 715 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 715 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2802", "outputIndexes": [ 716 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 716, 715 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2803", "outputIndexes": [ 717 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 707, 717, 710 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_4_output_0", "outputIndexes": [ 718 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 718, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Div_output_0", "outputIndexes": [ 719 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 719, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 720 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 699, 720, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_1_output_0", "outputIndexes": [ 721 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 721 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.6/self_attn/Neg_output_0", "outputIndexes": [ 722 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 719, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 723 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 699, 22, 723, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_output_0", "outputIndexes": [ 724 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 722, 724 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.6/self_attn/Concat_3_output_0", "outputIndexes": [ 725 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2698", "outputIndexes": [ 726 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2701", "outputIndexes": [ 727 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 726, 727, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2704", "outputIndexes": [ 728 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 728 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2705", "outputIndexes": [ 729 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 729 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2706", "outputIndexes": [ 730 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 730, 729 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2707", "outputIndexes": [ 731 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 731, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_3_output_0", "outputIndexes": [ 732 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 725, 732 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_1_output_0", "outputIndexes": [ 733 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 706, 733 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Add_output_0", "outputIndexes": [ 734 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4025 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 734443442, 2097174, 524288, 0, 0 ] } , "name": "/layers.6/self_attn/k_proj/Linear", "outputIndexes": [ 4030 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4030 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4031 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4031 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 735 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 686, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 736 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 694, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 737 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 736, 737, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.6/self_attn/Concat_1_output_0", "outputIndexes": [ 738 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 735, 738 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/self_attn/Reshape_1_output_0", "outputIndexes": [ 739 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 739 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 737064904, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.6/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 741 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 741, 705 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_2_output_0", "outputIndexes": [ 742 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 741 ] , "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_3_output_0", "outputIndexes": [ 743 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 743 ] , "main_type": "NONE", "name": "Shape2669", "outputIndexes": [ 744 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 743 ] , "main_type": "NONE", "name": "Rank2671", "outputIndexes": [ 745 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 745, 745 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2673", "outputIndexes": [ 746 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 746 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2674", "outputIndexes": [ 747 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 746, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2676", "outputIndexes": [ 748 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 748 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2677", "outputIndexes": [ 749 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 744, 747, 749, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2680", "outputIndexes": [ 750 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 750 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2681", "outputIndexes": [ 751 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 751 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2682", "outputIndexes": [ 752 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 752, 751 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2683", "outputIndexes": [ 753 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 743, 753, 746 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_5_output_0", "outputIndexes": [ 754 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 754, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Div_1_output_0", "outputIndexes": [ 755 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 755, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 756 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 741, 756, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_3_output_0", "outputIndexes": [ 757 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 757 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.6/self_attn/Neg_1_output_0", "outputIndexes": [ 758 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 755, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 759 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 741, 22, 759, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_2_output_0", "outputIndexes": [ 760 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 758, 760 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.6/self_attn/Concat_4_output_0", "outputIndexes": [ 761 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 761, 732 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_3_output_0", "outputIndexes": [ 762 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 742, 762 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Add_1_output_0", "outputIndexes": [ 763 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4025 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 737065928, 2097174, 524288, 0, 0 ] } , "name": "/layers.6/self_attn/v_proj/Linear", "outputIndexes": [ 4034 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4034 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4035 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4035 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 764 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 686, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 765 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 694, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 766 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 765, 766, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.6/self_attn/Concat_2_output_0", "outputIndexes": [ 767 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 764, 767 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/self_attn/Reshape_2_output_0", "outputIndexes": [ 768 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 734, 763, 768, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.6/self_attn/Reshape_7_output_0", "outputIndexes": [ 769 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 769 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4036 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4036 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4037 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4037 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 739687390, 8388630, 2097152, 0, 0 ] } , "name": "/layers.6/self_attn/o_proj/Linear", "outputIndexes": [ 4038 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4038 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4039 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4039 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 770 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 673, 770 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/Add_output_0", "outputIndexes": [ 771 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 771 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 750173172, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.6/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 772 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 772 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4040 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4040 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4041 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4041 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 750205940, 25165846, 6291456, 0, 0 ] } , "name": "/layers.6/mlp/gate_proj/Linear", "outputIndexes": [ 4042 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4042 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4043 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4043 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 773 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 773 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.6/mlp/act_fn/Mul_output_0", "outputIndexes": [ 774 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4041 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 781663242, 25165846, 6291456, 0, 0 ] } , "name": "/layers.6/mlp/up_proj/Linear", "outputIndexes": [ 4046 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4046 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4047 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4047 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 775 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 774, 775 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/mlp/Mul_output_0", "outputIndexes": [ 776 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 776 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4048 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4048 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4049 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4049 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 813120544, 25165846, 6291456, 0, 0 ] } , "name": "/layers.6/mlp/down_proj/Linear", "outputIndexes": [ 4050 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4050 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4051 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4051 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 777 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 771, 777 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/Add_1_output_0", "outputIndexes": [ 778 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 778, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/Reshape_output_0", "outputIndexes": [ 779 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 779 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 844577846, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.7/input_layernorm/Mul_1_output_0", "outputIndexes": [ 780 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 780 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4052 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4052 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4053 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4053 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 844610614, 8388630, 2097152, 0, 0 ] } , "name": "/layers.7/self_attn/q_proj/Linear", "outputIndexes": [ 4054 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4054 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4055 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4055 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 781 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 780 ] , "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_output_0", "outputIndexes": [ 782 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 782 ] , "main_type": "NONE", "name": "Shape3028", "outputIndexes": [ 783 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 782 ] , "main_type": "NONE", "name": "Rank3030", "outputIndexes": [ 784 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 784, 784 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3032", "outputIndexes": [ 785 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 785 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3033", "outputIndexes": [ 786 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 785, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3035", "outputIndexes": [ 787 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 787 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3036", "outputIndexes": [ 788 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 783, 786, 788, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3039", "outputIndexes": [ 789 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 789 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3040", "outputIndexes": [ 790 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 790, 790 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3042", "outputIndexes": [ 791 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782, 791, 785 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_output_0", "outputIndexes": [ 792 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 792, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_output_0", "outputIndexes": [ 793 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 785 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3050", "outputIndexes": [ 794 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 787 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3053", "outputIndexes": [ 795 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 783, 794, 795, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3056", "outputIndexes": [ 796 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 796 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3057", "outputIndexes": [ 797 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 797 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3058", "outputIndexes": [ 798 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 798, 797 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3059", "outputIndexes": [ 799 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782, 799, 785 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_1_output_0", "outputIndexes": [ 800 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 800, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 801 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 793, 801, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.7/self_attn/Concat_output_0", "outputIndexes": [ 802 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 781, 802 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/self_attn/Reshape_output_0", "outputIndexes": [ 803 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 803 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 855096396, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.7/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 805 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3077", "outputIndexes": [ 806 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3080", "outputIndexes": [ 807 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 806, 807, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3083", "outputIndexes": [ 808 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 808 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3084", "outputIndexes": [ 809 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 809, 809 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3086", "outputIndexes": [ 810 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 810, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_2_output_0", "outputIndexes": [ 811 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 805, 811 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_output_0", "outputIndexes": [ 812 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 805 ] , "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_2_output_0", "outputIndexes": [ 813 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 813 ] , "main_type": "NONE", "name": "Shape3210", "outputIndexes": [ 814 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 813 ] , "main_type": "NONE", "name": "Rank3212", "outputIndexes": [ 815 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 815, 815 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3214", "outputIndexes": [ 816 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 816 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3215", "outputIndexes": [ 817 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 816, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3217", "outputIndexes": [ 818 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 818 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3218", "outputIndexes": [ 819 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 814, 817, 819, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3221", "outputIndexes": [ 820 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 820 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3222", "outputIndexes": [ 821 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 821 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3223", "outputIndexes": [ 822 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 822, 821 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3224", "outputIndexes": [ 823 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 813, 823, 816 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_4_output_0", "outputIndexes": [ 824 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 824, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Div_output_0", "outputIndexes": [ 825 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 825, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 826 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 805, 826, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_1_output_0", "outputIndexes": [ 827 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 827 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.7/self_attn/Neg_output_0", "outputIndexes": [ 828 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 825, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 829 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 805, 22, 829, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_output_0", "outputIndexes": [ 830 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 828, 830 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.7/self_attn/Concat_3_output_0", "outputIndexes": [ 831 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3119", "outputIndexes": [ 832 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3122", "outputIndexes": [ 833 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 832, 833, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3125", "outputIndexes": [ 834 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 834 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3126", "outputIndexes": [ 835 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 835 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3127", "outputIndexes": [ 836 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 836, 835 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3128", "outputIndexes": [ 837 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 837, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_3_output_0", "outputIndexes": [ 838 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 831, 838 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_1_output_0", "outputIndexes": [ 839 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 812, 839 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Add_output_0", "outputIndexes": [ 840 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4053 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 855097420, 2097174, 524288, 0, 0 ] } , "name": "/layers.7/self_attn/k_proj/Linear", "outputIndexes": [ 4058 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4058 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4059 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4059 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 841 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 792, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 842 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 800, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 843 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 842, 843, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.7/self_attn/Concat_1_output_0", "outputIndexes": [ 844 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 841, 844 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/self_attn/Reshape_1_output_0", "outputIndexes": [ 845 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 845 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 857718882, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.7/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 847 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 847, 811 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_2_output_0", "outputIndexes": [ 848 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 847 ] , "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_3_output_0", "outputIndexes": [ 849 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 849 ] , "main_type": "NONE", "name": "Shape3090", "outputIndexes": [ 850 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 849 ] , "main_type": "NONE", "name": "Rank3092", "outputIndexes": [ 851 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 851, 851 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3094", "outputIndexes": [ 852 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 852 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3095", "outputIndexes": [ 853 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 852, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3097", "outputIndexes": [ 854 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 854 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3098", "outputIndexes": [ 855 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 850, 853, 855, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3101", "outputIndexes": [ 856 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 856 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3102", "outputIndexes": [ 857 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 857 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3103", "outputIndexes": [ 858 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 858, 857 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3104", "outputIndexes": [ 859 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 849, 859, 852 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_5_output_0", "outputIndexes": [ 860 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 860, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Div_1_output_0", "outputIndexes": [ 861 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 861, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 862 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 847, 862, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_3_output_0", "outputIndexes": [ 863 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 863 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.7/self_attn/Neg_1_output_0", "outputIndexes": [ 864 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 861, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 865 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 847, 22, 865, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_2_output_0", "outputIndexes": [ 866 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 864, 866 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.7/self_attn/Concat_4_output_0", "outputIndexes": [ 867 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 867, 838 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_3_output_0", "outputIndexes": [ 868 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 848, 868 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Add_1_output_0", "outputIndexes": [ 869 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4053 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 857719906, 2097174, 524288, 0, 0 ] } , "name": "/layers.7/self_attn/v_proj/Linear", "outputIndexes": [ 4062 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4062 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4063 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4063 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 870 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 792, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 871 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 800, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 872 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 871, 872, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.7/self_attn/Concat_2_output_0", "outputIndexes": [ 873 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 870, 873 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/self_attn/Reshape_2_output_0", "outputIndexes": [ 874 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 840, 869, 874, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.7/self_attn/Reshape_7_output_0", "outputIndexes": [ 875 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 875 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4064 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4064 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4065 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4065 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 860341368, 8388630, 2097152, 0, 0 ] } , "name": "/layers.7/self_attn/o_proj/Linear", "outputIndexes": [ 4066 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4066 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4067 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4067 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 876 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 779, 876 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/Add_output_0", "outputIndexes": [ 877 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 877 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 870827150, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.7/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 878 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 878 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4068 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4068 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4069 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4069 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 870859918, 25165846, 6291456, 0, 0 ] } , "name": "/layers.7/mlp/gate_proj/Linear", "outputIndexes": [ 4070 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4070 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4071 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4071 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 879 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 879 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.7/mlp/act_fn/Mul_output_0", "outputIndexes": [ 880 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4069 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 902317220, 25165846, 6291456, 0, 0 ] } , "name": "/layers.7/mlp/up_proj/Linear", "outputIndexes": [ 4074 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4074 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4075 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4075 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 881 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 880, 881 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/mlp/Mul_output_0", "outputIndexes": [ 882 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 882 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4076 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4076 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4077 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4077 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 933774522, 25165846, 6291456, 0, 0 ] } , "name": "/layers.7/mlp/down_proj/Linear", "outputIndexes": [ 4078 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4078 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4079 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4079 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 883 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 877, 883 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/Add_1_output_0", "outputIndexes": [ 884 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 884, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/Reshape_output_0", "outputIndexes": [ 885 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 885 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 965231824, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.8/input_layernorm/Mul_1_output_0", "outputIndexes": [ 886 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 886 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4080 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4080 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4081 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4081 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 965264592, 8388630, 2097152, 0, 0 ] } , "name": "/layers.8/self_attn/q_proj/Linear", "outputIndexes": [ 4082 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4082 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4083 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4083 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 887 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 886 ] , "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_output_0", "outputIndexes": [ 888 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 888 ] , "main_type": "NONE", "name": "Shape3449", "outputIndexes": [ 889 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 888 ] , "main_type": "NONE", "name": "Rank3451", "outputIndexes": [ 890 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 890, 890 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3453", "outputIndexes": [ 891 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 891 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3454", "outputIndexes": [ 892 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 891, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3456", "outputIndexes": [ 893 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 893 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3457", "outputIndexes": [ 894 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 889, 892, 894, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3460", "outputIndexes": [ 895 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 895 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3461", "outputIndexes": [ 896 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 896, 896 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3463", "outputIndexes": [ 897 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 888, 897, 891 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_output_0", "outputIndexes": [ 898 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 898, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_output_0", "outputIndexes": [ 899 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 891 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3471", "outputIndexes": [ 900 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 893 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3474", "outputIndexes": [ 901 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 889, 900, 901, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3477", "outputIndexes": [ 902 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 902 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3478", "outputIndexes": [ 903 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 903 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3479", "outputIndexes": [ 904 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 904, 903 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3480", "outputIndexes": [ 905 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 888, 905, 891 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_1_output_0", "outputIndexes": [ 906 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 906, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 907 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 899, 907, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.8/self_attn/Concat_output_0", "outputIndexes": [ 908 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 887, 908 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/self_attn/Reshape_output_0", "outputIndexes": [ 909 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 909 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 975750374, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.8/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 911 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3498", "outputIndexes": [ 912 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3501", "outputIndexes": [ 913 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 912, 913, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3504", "outputIndexes": [ 914 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 914 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3505", "outputIndexes": [ 915 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 915, 915 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3507", "outputIndexes": [ 916 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 916, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_2_output_0", "outputIndexes": [ 917 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 911, 917 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_output_0", "outputIndexes": [ 918 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 911 ] , "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_2_output_0", "outputIndexes": [ 919 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 919 ] , "main_type": "NONE", "name": "Shape3631", "outputIndexes": [ 920 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 919 ] , "main_type": "NONE", "name": "Rank3633", "outputIndexes": [ 921 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 921, 921 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3635", "outputIndexes": [ 922 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 922 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3636", "outputIndexes": [ 923 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 922, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3638", "outputIndexes": [ 924 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 924 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3639", "outputIndexes": [ 925 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 920, 923, 925, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3642", "outputIndexes": [ 926 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 926 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3643", "outputIndexes": [ 927 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 927 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3644", "outputIndexes": [ 928 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 928, 927 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3645", "outputIndexes": [ 929 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 919, 929, 922 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_4_output_0", "outputIndexes": [ 930 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 930, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Div_output_0", "outputIndexes": [ 931 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 931, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 932 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 911, 932, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_1_output_0", "outputIndexes": [ 933 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 933 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.8/self_attn/Neg_output_0", "outputIndexes": [ 934 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 931, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 935 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 911, 22, 935, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_output_0", "outputIndexes": [ 936 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 934, 936 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.8/self_attn/Concat_3_output_0", "outputIndexes": [ 937 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3540", "outputIndexes": [ 938 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3543", "outputIndexes": [ 939 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 938, 939, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3546", "outputIndexes": [ 940 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 940 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3547", "outputIndexes": [ 941 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 941 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3548", "outputIndexes": [ 942 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 942, 941 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3549", "outputIndexes": [ 943 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 943, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_3_output_0", "outputIndexes": [ 944 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 937, 944 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_1_output_0", "outputIndexes": [ 945 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 918, 945 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Add_output_0", "outputIndexes": [ 946 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4081 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 975751398, 2097174, 524288, 0, 0 ] } , "name": "/layers.8/self_attn/k_proj/Linear", "outputIndexes": [ 4086 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4086 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4087 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4087 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 947 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 898, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 948 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 906, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 949 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 948, 949, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.8/self_attn/Concat_1_output_0", "outputIndexes": [ 950 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 947, 950 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/self_attn/Reshape_1_output_0", "outputIndexes": [ 951 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 951 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 978372860, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.8/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 953 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 953, 917 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_2_output_0", "outputIndexes": [ 954 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 953 ] , "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_3_output_0", "outputIndexes": [ 955 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 955 ] , "main_type": "NONE", "name": "Shape3511", "outputIndexes": [ 956 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 955 ] , "main_type": "NONE", "name": "Rank3513", "outputIndexes": [ 957 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 957, 957 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3515", "outputIndexes": [ 958 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 958 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3516", "outputIndexes": [ 959 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 958, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3518", "outputIndexes": [ 960 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 960 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3519", "outputIndexes": [ 961 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 956, 959, 961, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3522", "outputIndexes": [ 962 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 962 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3523", "outputIndexes": [ 963 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 963 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3524", "outputIndexes": [ 964 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 964, 963 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3525", "outputIndexes": [ 965 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 955, 965, 958 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_5_output_0", "outputIndexes": [ 966 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 966, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Div_1_output_0", "outputIndexes": [ 967 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 967, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 968 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 953, 968, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_3_output_0", "outputIndexes": [ 969 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 969 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.8/self_attn/Neg_1_output_0", "outputIndexes": [ 970 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 967, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 971 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 953, 22, 971, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_2_output_0", "outputIndexes": [ 972 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 970, 972 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.8/self_attn/Concat_4_output_0", "outputIndexes": [ 973 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 973, 944 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_3_output_0", "outputIndexes": [ 974 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 954, 974 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Add_1_output_0", "outputIndexes": [ 975 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4081 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 978373884, 2097174, 524288, 0, 0 ] } , "name": "/layers.8/self_attn/v_proj/Linear", "outputIndexes": [ 4090 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4090 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4091 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4091 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 976 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 898, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 977 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 906, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 978 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 977, 978, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.8/self_attn/Concat_2_output_0", "outputIndexes": [ 979 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 976, 979 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/self_attn/Reshape_2_output_0", "outputIndexes": [ 980 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 946, 975, 980, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.8/self_attn/Reshape_7_output_0", "outputIndexes": [ 981 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 981 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4092 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4092 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4093 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4093 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 980995346, 8388630, 2097152, 0, 0 ] } , "name": "/layers.8/self_attn/o_proj/Linear", "outputIndexes": [ 4094 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4094 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4095 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4095 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 982 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 885, 982 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/Add_output_0", "outputIndexes": [ 983 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 983 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 991481128, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.8/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 984 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 984 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4096 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4096 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4097 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4097 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 991513896, 25165846, 6291456, 0, 0 ] } , "name": "/layers.8/mlp/gate_proj/Linear", "outputIndexes": [ 4098 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4098 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4099 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4099 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 985 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 985 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.8/mlp/act_fn/Mul_output_0", "outputIndexes": [ 986 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4097 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1022971198, 25165846, 6291456, 0, 0 ] } , "name": "/layers.8/mlp/up_proj/Linear", "outputIndexes": [ 4102 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4102 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4103 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4103 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 987 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 986, 987 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/mlp/Mul_output_0", "outputIndexes": [ 988 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 988 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4104 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4104 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4105 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4105 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1054428500, 25165846, 6291456, 0, 0 ] } , "name": "/layers.8/mlp/down_proj/Linear", "outputIndexes": [ 4106 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4106 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4107 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4107 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 989 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 983, 989 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/Add_1_output_0", "outputIndexes": [ 990 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 990, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/Reshape_output_0", "outputIndexes": [ 991 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 991 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1085885802, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.9/input_layernorm/Mul_1_output_0", "outputIndexes": [ 992 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 992 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4108 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4108 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4109 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4109 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1085918570, 8388630, 2097152, 0, 0 ] } , "name": "/layers.9/self_attn/q_proj/Linear", "outputIndexes": [ 4110 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4110 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4111 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4111 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 993 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 992 ] , "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_output_0", "outputIndexes": [ 994 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 994 ] , "main_type": "NONE", "name": "Shape3870", "outputIndexes": [ 995 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 994 ] , "main_type": "NONE", "name": "Rank3872", "outputIndexes": [ 996 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 996, 996 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3874", "outputIndexes": [ 997 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 997 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3875", "outputIndexes": [ 998 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 997, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3877", "outputIndexes": [ 999 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 999 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3878", "outputIndexes": [ 1000 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 995, 998, 1000, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3881", "outputIndexes": [ 1001 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1001 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3882", "outputIndexes": [ 1002 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1002, 1002 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3884", "outputIndexes": [ 1003 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 994, 1003, 997 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_output_0", "outputIndexes": [ 1004 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1004, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1005 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 997 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3892", "outputIndexes": [ 1006 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 999 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3895", "outputIndexes": [ 1007 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 995, 1006, 1007, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3898", "outputIndexes": [ 1008 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1008 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3899", "outputIndexes": [ 1009 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1009 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3900", "outputIndexes": [ 1010 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1010, 1009 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3901", "outputIndexes": [ 1011 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 994, 1011, 997 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_1_output_0", "outputIndexes": [ 1012 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1012, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1013 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1005, 1013, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.9/self_attn/Concat_output_0", "outputIndexes": [ 1014 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 993, 1014 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/self_attn/Reshape_output_0", "outputIndexes": [ 1015 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1015 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1096404352, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.9/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1017 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3919", "outputIndexes": [ 1018 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3922", "outputIndexes": [ 1019 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1018, 1019, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3925", "outputIndexes": [ 1020 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1020 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3926", "outputIndexes": [ 1021 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1021, 1021 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3928", "outputIndexes": [ 1022 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1022, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_2_output_0", "outputIndexes": [ 1023 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1017, 1023 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_output_0", "outputIndexes": [ 1024 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1017 ] , "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_2_output_0", "outputIndexes": [ 1025 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1025 ] , "main_type": "NONE", "name": "Shape4052", "outputIndexes": [ 1026 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1025 ] , "main_type": "NONE", "name": "Rank4054", "outputIndexes": [ 1027 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1027, 1027 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4056", "outputIndexes": [ 1028 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1028 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4057", "outputIndexes": [ 1029 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1028, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4059", "outputIndexes": [ 1030 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1030 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4060", "outputIndexes": [ 1031 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1026, 1029, 1031, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4063", "outputIndexes": [ 1032 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1032 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4064", "outputIndexes": [ 1033 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1033 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4065", "outputIndexes": [ 1034 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1034, 1033 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4066", "outputIndexes": [ 1035 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1025, 1035, 1028 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_4_output_0", "outputIndexes": [ 1036 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1036, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Div_output_0", "outputIndexes": [ 1037 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1037, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1038 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1017, 1038, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_1_output_0", "outputIndexes": [ 1039 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1039 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.9/self_attn/Neg_output_0", "outputIndexes": [ 1040 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1037, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1041 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1017, 22, 1041, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_output_0", "outputIndexes": [ 1042 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1040, 1042 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.9/self_attn/Concat_3_output_0", "outputIndexes": [ 1043 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3961", "outputIndexes": [ 1044 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3964", "outputIndexes": [ 1045 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1044, 1045, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3967", "outputIndexes": [ 1046 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1046 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3968", "outputIndexes": [ 1047 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1047 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3969", "outputIndexes": [ 1048 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1048, 1047 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3970", "outputIndexes": [ 1049 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1049, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_3_output_0", "outputIndexes": [ 1050 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1043, 1050 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_1_output_0", "outputIndexes": [ 1051 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1024, 1051 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Add_output_0", "outputIndexes": [ 1052 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4109 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1096405376, 2097174, 524288, 0, 0 ] } , "name": "/layers.9/self_attn/k_proj/Linear", "outputIndexes": [ 4114 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4114 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4115 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4115 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1053 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1004, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1054 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1012, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1055 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1054, 1055, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.9/self_attn/Concat_1_output_0", "outputIndexes": [ 1056 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1053, 1056 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/self_attn/Reshape_1_output_0", "outputIndexes": [ 1057 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1057 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1099026838, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.9/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1059 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1059, 1023 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_2_output_0", "outputIndexes": [ 1060 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1059 ] , "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_3_output_0", "outputIndexes": [ 1061 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1061 ] , "main_type": "NONE", "name": "Shape3932", "outputIndexes": [ 1062 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1061 ] , "main_type": "NONE", "name": "Rank3934", "outputIndexes": [ 1063 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1063, 1063 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3936", "outputIndexes": [ 1064 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1064 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3937", "outputIndexes": [ 1065 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1064, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3939", "outputIndexes": [ 1066 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1066 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3940", "outputIndexes": [ 1067 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1062, 1065, 1067, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3943", "outputIndexes": [ 1068 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1068 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3944", "outputIndexes": [ 1069 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1069 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3945", "outputIndexes": [ 1070 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1070, 1069 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3946", "outputIndexes": [ 1071 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1061, 1071, 1064 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_5_output_0", "outputIndexes": [ 1072 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1072, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Div_1_output_0", "outputIndexes": [ 1073 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1073, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1074 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1059, 1074, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_3_output_0", "outputIndexes": [ 1075 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1075 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.9/self_attn/Neg_1_output_0", "outputIndexes": [ 1076 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1073, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1077 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1059, 22, 1077, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_2_output_0", "outputIndexes": [ 1078 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1076, 1078 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.9/self_attn/Concat_4_output_0", "outputIndexes": [ 1079 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1079, 1050 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_3_output_0", "outputIndexes": [ 1080 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1060, 1080 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Add_1_output_0", "outputIndexes": [ 1081 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4109 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1099027862, 2097174, 524288, 0, 0 ] } , "name": "/layers.9/self_attn/v_proj/Linear", "outputIndexes": [ 4118 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4118 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4119 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4119 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1082 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1004, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1083 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1012, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1084 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1083, 1084, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.9/self_attn/Concat_2_output_0", "outputIndexes": [ 1085 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1082, 1085 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/self_attn/Reshape_2_output_0", "outputIndexes": [ 1086 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1052, 1081, 1086, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.9/self_attn/Reshape_7_output_0", "outputIndexes": [ 1087 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1087 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4120 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4120 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4121 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4121 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1101649324, 8388630, 2097152, 0, 0 ] } , "name": "/layers.9/self_attn/o_proj/Linear", "outputIndexes": [ 4122 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4122 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4123 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4123 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1088 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 991, 1088 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/Add_output_0", "outputIndexes": [ 1089 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1089 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1112135106, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.9/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1090 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1090 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4124 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4124 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4125 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4125 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1112167874, 25165846, 6291456, 0, 0 ] } , "name": "/layers.9/mlp/gate_proj/Linear", "outputIndexes": [ 4126 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4126 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4127 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4127 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1091 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1091 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.9/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1092 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4125 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1143625176, 25165846, 6291456, 0, 0 ] } , "name": "/layers.9/mlp/up_proj/Linear", "outputIndexes": [ 4130 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4130 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4131 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4131 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1093 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1092, 1093 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/mlp/Mul_output_0", "outputIndexes": [ 1094 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1094 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4132 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4132 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4133 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4133 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1175082478, 25165846, 6291456, 0, 0 ] } , "name": "/layers.9/mlp/down_proj/Linear", "outputIndexes": [ 4134 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4134 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4135 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4135 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1095 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1089, 1095 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/Add_1_output_0", "outputIndexes": [ 1096 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1096, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/Reshape_output_0", "outputIndexes": [ 1097 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1097 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1206539780, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.10/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1098 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1098 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4136 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4136 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4137 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4137 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1206572548, 8388630, 2097152, 0, 0 ] } , "name": "/layers.10/self_attn/q_proj/Linear", "outputIndexes": [ 4138 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4138 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4139 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4139 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1099 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1098 ] , "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_output_0", "outputIndexes": [ 1100 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1100 ] , "main_type": "NONE", "name": "Shape4291", "outputIndexes": [ 1101 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1100 ] , "main_type": "NONE", "name": "Rank4293", "outputIndexes": [ 1102 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1102, 1102 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4295", "outputIndexes": [ 1103 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1103 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4296", "outputIndexes": [ 1104 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1103, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4298", "outputIndexes": [ 1105 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1105 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4299", "outputIndexes": [ 1106 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1101, 1104, 1106, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4302", "outputIndexes": [ 1107 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1107 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4303", "outputIndexes": [ 1108 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1108, 1108 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4305", "outputIndexes": [ 1109 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1100, 1109, 1103 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_output_0", "outputIndexes": [ 1110 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1110, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1111 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1103 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4313", "outputIndexes": [ 1112 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1105 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4316", "outputIndexes": [ 1113 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1101, 1112, 1113, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4319", "outputIndexes": [ 1114 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1114 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4320", "outputIndexes": [ 1115 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1115 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4321", "outputIndexes": [ 1116 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1116, 1115 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4322", "outputIndexes": [ 1117 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1100, 1117, 1103 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_1_output_0", "outputIndexes": [ 1118 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1118, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1119 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1111, 1119, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.10/self_attn/Concat_output_0", "outputIndexes": [ 1120 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1099, 1120 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/self_attn/Reshape_output_0", "outputIndexes": [ 1121 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1121 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1217058330, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.10/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1123 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4340", "outputIndexes": [ 1124 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4343", "outputIndexes": [ 1125 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1124, 1125, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4346", "outputIndexes": [ 1126 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1126 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4347", "outputIndexes": [ 1127 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1127, 1127 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4349", "outputIndexes": [ 1128 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1128, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_2_output_0", "outputIndexes": [ 1129 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1123, 1129 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_output_0", "outputIndexes": [ 1130 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1123 ] , "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_2_output_0", "outputIndexes": [ 1131 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1131 ] , "main_type": "NONE", "name": "Shape4473", "outputIndexes": [ 1132 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1131 ] , "main_type": "NONE", "name": "Rank4475", "outputIndexes": [ 1133 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1133, 1133 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4477", "outputIndexes": [ 1134 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1134 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4478", "outputIndexes": [ 1135 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1134, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4480", "outputIndexes": [ 1136 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1136 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4481", "outputIndexes": [ 1137 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1132, 1135, 1137, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4484", "outputIndexes": [ 1138 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1138 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4485", "outputIndexes": [ 1139 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1139 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4486", "outputIndexes": [ 1140 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1140, 1139 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4487", "outputIndexes": [ 1141 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1131, 1141, 1134 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_4_output_0", "outputIndexes": [ 1142 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1142, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Div_output_0", "outputIndexes": [ 1143 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1143, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1144 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1123, 1144, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_1_output_0", "outputIndexes": [ 1145 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1145 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.10/self_attn/Neg_output_0", "outputIndexes": [ 1146 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1143, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1147 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1123, 22, 1147, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_output_0", "outputIndexes": [ 1148 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1146, 1148 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.10/self_attn/Concat_3_output_0", "outputIndexes": [ 1149 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4382", "outputIndexes": [ 1150 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4385", "outputIndexes": [ 1151 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1150, 1151, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4388", "outputIndexes": [ 1152 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1152 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4389", "outputIndexes": [ 1153 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1153 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4390", "outputIndexes": [ 1154 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1154, 1153 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4391", "outputIndexes": [ 1155 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1155, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_3_output_0", "outputIndexes": [ 1156 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1149, 1156 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_1_output_0", "outputIndexes": [ 1157 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1130, 1157 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Add_output_0", "outputIndexes": [ 1158 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4137 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1217059354, 2097174, 524288, 0, 0 ] } , "name": "/layers.10/self_attn/k_proj/Linear", "outputIndexes": [ 4142 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4142 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4143 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4143 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1159 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1110, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1160 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1118, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1161 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1160, 1161, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.10/self_attn/Concat_1_output_0", "outputIndexes": [ 1162 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1159, 1162 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/self_attn/Reshape_1_output_0", "outputIndexes": [ 1163 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1163 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1219680816, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.10/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1165 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165, 1129 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_2_output_0", "outputIndexes": [ 1166 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165 ] , "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_3_output_0", "outputIndexes": [ 1167 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1167 ] , "main_type": "NONE", "name": "Shape4353", "outputIndexes": [ 1168 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1167 ] , "main_type": "NONE", "name": "Rank4355", "outputIndexes": [ 1169 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1169, 1169 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4357", "outputIndexes": [ 1170 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1170 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4358", "outputIndexes": [ 1171 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1170, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4360", "outputIndexes": [ 1172 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1172 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4361", "outputIndexes": [ 1173 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1168, 1171, 1173, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4364", "outputIndexes": [ 1174 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1174 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4365", "outputIndexes": [ 1175 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1175 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4366", "outputIndexes": [ 1176 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1176, 1175 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4367", "outputIndexes": [ 1177 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1167, 1177, 1170 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_5_output_0", "outputIndexes": [ 1178 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1178, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Div_1_output_0", "outputIndexes": [ 1179 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1179, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1180 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165, 1180, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_3_output_0", "outputIndexes": [ 1181 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1181 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.10/self_attn/Neg_1_output_0", "outputIndexes": [ 1182 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1179, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1183 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165, 22, 1183, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_2_output_0", "outputIndexes": [ 1184 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1182, 1184 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.10/self_attn/Concat_4_output_0", "outputIndexes": [ 1185 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1185, 1156 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_3_output_0", "outputIndexes": [ 1186 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1166, 1186 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Add_1_output_0", "outputIndexes": [ 1187 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4137 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1219681840, 2097174, 524288, 0, 0 ] } , "name": "/layers.10/self_attn/v_proj/Linear", "outputIndexes": [ 4146 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4146 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4147 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4147 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1188 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1110, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1189 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1118, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1190 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1189, 1190, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.10/self_attn/Concat_2_output_0", "outputIndexes": [ 1191 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1188, 1191 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/self_attn/Reshape_2_output_0", "outputIndexes": [ 1192 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1158, 1187, 1192, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.10/self_attn/Reshape_7_output_0", "outputIndexes": [ 1193 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1193 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4148 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4148 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4149 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4149 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1222303302, 8388630, 2097152, 0, 0 ] } , "name": "/layers.10/self_attn/o_proj/Linear", "outputIndexes": [ 4150 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4150 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4151 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4151 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1194 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1097, 1194 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/Add_output_0", "outputIndexes": [ 1195 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1195 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1232789084, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.10/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1196 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1196 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4152 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4152 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4153 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4153 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1232821852, 25165846, 6291456, 0, 0 ] } , "name": "/layers.10/mlp/gate_proj/Linear", "outputIndexes": [ 4154 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4154 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4155 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4155 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1197 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1197 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.10/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1198 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4153 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1264279154, 25165846, 6291456, 0, 0 ] } , "name": "/layers.10/mlp/up_proj/Linear", "outputIndexes": [ 4158 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4158 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4159 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4159 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1199 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1198, 1199 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/mlp/Mul_output_0", "outputIndexes": [ 1200 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1200 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4160 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4160 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4161 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4161 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1295736456, 25165846, 6291456, 0, 0 ] } , "name": "/layers.10/mlp/down_proj/Linear", "outputIndexes": [ 4162 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4162 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4163 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4163 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1201 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1195, 1201 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/Add_1_output_0", "outputIndexes": [ 1202 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1202, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/Reshape_output_0", "outputIndexes": [ 1203 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1203 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1327193758, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.11/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1204 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1204 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4164 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4164 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4165 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4165 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1327226526, 8388630, 2097152, 0, 0 ] } , "name": "/layers.11/self_attn/q_proj/Linear", "outputIndexes": [ 4166 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4166 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4167 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4167 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1205 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1204 ] , "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_output_0", "outputIndexes": [ 1206 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1206 ] , "main_type": "NONE", "name": "Shape4712", "outputIndexes": [ 1207 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1206 ] , "main_type": "NONE", "name": "Rank4714", "outputIndexes": [ 1208 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1208, 1208 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4716", "outputIndexes": [ 1209 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1209 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4717", "outputIndexes": [ 1210 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1209, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4719", "outputIndexes": [ 1211 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1211 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4720", "outputIndexes": [ 1212 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1207, 1210, 1212, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4723", "outputIndexes": [ 1213 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1213 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4724", "outputIndexes": [ 1214 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1214, 1214 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4726", "outputIndexes": [ 1215 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1206, 1215, 1209 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_output_0", "outputIndexes": [ 1216 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1216, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1217 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1209 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4734", "outputIndexes": [ 1218 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1211 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4737", "outputIndexes": [ 1219 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1207, 1218, 1219, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4740", "outputIndexes": [ 1220 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1220 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4741", "outputIndexes": [ 1221 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1221 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4742", "outputIndexes": [ 1222 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1222, 1221 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4743", "outputIndexes": [ 1223 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1206, 1223, 1209 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_1_output_0", "outputIndexes": [ 1224 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1224, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1225 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1217, 1225, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.11/self_attn/Concat_output_0", "outputIndexes": [ 1226 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1205, 1226 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/self_attn/Reshape_output_0", "outputIndexes": [ 1227 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1227 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1337712308, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.11/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1229 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4761", "outputIndexes": [ 1230 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4764", "outputIndexes": [ 1231 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1230, 1231, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4767", "outputIndexes": [ 1232 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1232 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4768", "outputIndexes": [ 1233 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1233, 1233 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4770", "outputIndexes": [ 1234 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1234, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_2_output_0", "outputIndexes": [ 1235 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1229, 1235 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_output_0", "outputIndexes": [ 1236 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1229 ] , "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_2_output_0", "outputIndexes": [ 1237 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1237 ] , "main_type": "NONE", "name": "Shape4894", "outputIndexes": [ 1238 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1237 ] , "main_type": "NONE", "name": "Rank4896", "outputIndexes": [ 1239 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1239, 1239 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4898", "outputIndexes": [ 1240 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1240 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4899", "outputIndexes": [ 1241 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1240, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4901", "outputIndexes": [ 1242 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1242 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4902", "outputIndexes": [ 1243 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1238, 1241, 1243, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4905", "outputIndexes": [ 1244 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1244 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4906", "outputIndexes": [ 1245 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1245 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4907", "outputIndexes": [ 1246 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1246, 1245 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4908", "outputIndexes": [ 1247 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1237, 1247, 1240 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_4_output_0", "outputIndexes": [ 1248 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1248, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Div_output_0", "outputIndexes": [ 1249 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1249, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1250 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1229, 1250, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_1_output_0", "outputIndexes": [ 1251 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1251 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.11/self_attn/Neg_output_0", "outputIndexes": [ 1252 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1249, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1253 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1229, 22, 1253, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_output_0", "outputIndexes": [ 1254 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1252, 1254 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.11/self_attn/Concat_3_output_0", "outputIndexes": [ 1255 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4803", "outputIndexes": [ 1256 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4806", "outputIndexes": [ 1257 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1256, 1257, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4809", "outputIndexes": [ 1258 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1258 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4810", "outputIndexes": [ 1259 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1259 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4811", "outputIndexes": [ 1260 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1260, 1259 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4812", "outputIndexes": [ 1261 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1261, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_3_output_0", "outputIndexes": [ 1262 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1255, 1262 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_1_output_0", "outputIndexes": [ 1263 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1236, 1263 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Add_output_0", "outputIndexes": [ 1264 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4165 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1337713332, 2097174, 524288, 0, 0 ] } , "name": "/layers.11/self_attn/k_proj/Linear", "outputIndexes": [ 4170 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4170 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4171 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4171 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1265 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1216, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1266 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1224, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1267 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1266, 1267, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.11/self_attn/Concat_1_output_0", "outputIndexes": [ 1268 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1265, 1268 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/self_attn/Reshape_1_output_0", "outputIndexes": [ 1269 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1269 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1340334794, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.11/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1271 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1271, 1235 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_2_output_0", "outputIndexes": [ 1272 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1271 ] , "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_3_output_0", "outputIndexes": [ 1273 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1273 ] , "main_type": "NONE", "name": "Shape4774", "outputIndexes": [ 1274 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1273 ] , "main_type": "NONE", "name": "Rank4776", "outputIndexes": [ 1275 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1275, 1275 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4778", "outputIndexes": [ 1276 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1276 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4779", "outputIndexes": [ 1277 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1276, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4781", "outputIndexes": [ 1278 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1278 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4782", "outputIndexes": [ 1279 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1274, 1277, 1279, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4785", "outputIndexes": [ 1280 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1280 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4786", "outputIndexes": [ 1281 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1281 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4787", "outputIndexes": [ 1282 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1282, 1281 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4788", "outputIndexes": [ 1283 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1273, 1283, 1276 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_5_output_0", "outputIndexes": [ 1284 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1284, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Div_1_output_0", "outputIndexes": [ 1285 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1285, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1286 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1271, 1286, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_3_output_0", "outputIndexes": [ 1287 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1287 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.11/self_attn/Neg_1_output_0", "outputIndexes": [ 1288 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1285, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1289 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1271, 22, 1289, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_2_output_0", "outputIndexes": [ 1290 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1288, 1290 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.11/self_attn/Concat_4_output_0", "outputIndexes": [ 1291 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1291, 1262 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_3_output_0", "outputIndexes": [ 1292 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1272, 1292 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Add_1_output_0", "outputIndexes": [ 1293 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4165 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1340335818, 2097174, 524288, 0, 0 ] } , "name": "/layers.11/self_attn/v_proj/Linear", "outputIndexes": [ 4174 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4174 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4175 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4175 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1294 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1216, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1295 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1224, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1296 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1295, 1296, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.11/self_attn/Concat_2_output_0", "outputIndexes": [ 1297 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1294, 1297 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/self_attn/Reshape_2_output_0", "outputIndexes": [ 1298 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1264, 1293, 1298, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.11/self_attn/Reshape_7_output_0", "outputIndexes": [ 1299 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1299 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4176 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4176 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4177 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4177 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1342957280, 8388630, 2097152, 0, 0 ] } , "name": "/layers.11/self_attn/o_proj/Linear", "outputIndexes": [ 4178 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4178 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4179 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4179 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1300 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1203, 1300 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/Add_output_0", "outputIndexes": [ 1301 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1301 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1353443062, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.11/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1302 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1302 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4180 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4180 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4181 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4181 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1353475830, 25165846, 6291456, 0, 0 ] } , "name": "/layers.11/mlp/gate_proj/Linear", "outputIndexes": [ 4182 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4182 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4183 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4183 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1303 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1303 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.11/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1304 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4181 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1384933132, 25165846, 6291456, 0, 0 ] } , "name": "/layers.11/mlp/up_proj/Linear", "outputIndexes": [ 4186 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4186 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4187 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4187 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1305 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1304, 1305 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/mlp/Mul_output_0", "outputIndexes": [ 1306 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1306 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4188 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4188 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4189 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4189 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1416390434, 25165846, 6291456, 0, 0 ] } , "name": "/layers.11/mlp/down_proj/Linear", "outputIndexes": [ 4190 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4190 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4191 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4191 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1307 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1301, 1307 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/Add_1_output_0", "outputIndexes": [ 1308 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1308, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/Reshape_output_0", "outputIndexes": [ 1309 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1309 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1447847736, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.12/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1310 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1310 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4192 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4192 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4193 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4193 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1447880504, 8388630, 2097152, 0, 0 ] } , "name": "/layers.12/self_attn/q_proj/Linear", "outputIndexes": [ 4194 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4194 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4195 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4195 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1311 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1310 ] , "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_output_0", "outputIndexes": [ 1312 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1312 ] , "main_type": "NONE", "name": "Shape5133", "outputIndexes": [ 1313 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1312 ] , "main_type": "NONE", "name": "Rank5135", "outputIndexes": [ 1314 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1314, 1314 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5137", "outputIndexes": [ 1315 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1315 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5138", "outputIndexes": [ 1316 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1315, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5140", "outputIndexes": [ 1317 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1317 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5141", "outputIndexes": [ 1318 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1313, 1316, 1318, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5144", "outputIndexes": [ 1319 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1319 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5145", "outputIndexes": [ 1320 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1320, 1320 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5147", "outputIndexes": [ 1321 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1312, 1321, 1315 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_output_0", "outputIndexes": [ 1322 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1322, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1323 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1315 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5155", "outputIndexes": [ 1324 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1317 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5158", "outputIndexes": [ 1325 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1313, 1324, 1325, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5161", "outputIndexes": [ 1326 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1326 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5162", "outputIndexes": [ 1327 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1327 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5163", "outputIndexes": [ 1328 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1328, 1327 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5164", "outputIndexes": [ 1329 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1312, 1329, 1315 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_1_output_0", "outputIndexes": [ 1330 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1330, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1331 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1323, 1331, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.12/self_attn/Concat_output_0", "outputIndexes": [ 1332 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1311, 1332 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/self_attn/Reshape_output_0", "outputIndexes": [ 1333 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1333 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1458366286, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.12/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1335 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5182", "outputIndexes": [ 1336 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5185", "outputIndexes": [ 1337 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1336, 1337, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5188", "outputIndexes": [ 1338 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1338 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5189", "outputIndexes": [ 1339 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1339, 1339 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5191", "outputIndexes": [ 1340 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1340, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_2_output_0", "outputIndexes": [ 1341 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1335, 1341 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_output_0", "outputIndexes": [ 1342 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1335 ] , "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_2_output_0", "outputIndexes": [ 1343 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1343 ] , "main_type": "NONE", "name": "Shape5315", "outputIndexes": [ 1344 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1343 ] , "main_type": "NONE", "name": "Rank5317", "outputIndexes": [ 1345 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1345, 1345 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5319", "outputIndexes": [ 1346 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1346 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5320", "outputIndexes": [ 1347 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1346, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5322", "outputIndexes": [ 1348 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1348 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5323", "outputIndexes": [ 1349 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1344, 1347, 1349, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5326", "outputIndexes": [ 1350 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1350 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5327", "outputIndexes": [ 1351 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1351 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5328", "outputIndexes": [ 1352 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1352, 1351 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5329", "outputIndexes": [ 1353 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1343, 1353, 1346 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_4_output_0", "outputIndexes": [ 1354 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1354, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Div_output_0", "outputIndexes": [ 1355 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1355, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1356 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1335, 1356, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_1_output_0", "outputIndexes": [ 1357 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1357 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.12/self_attn/Neg_output_0", "outputIndexes": [ 1358 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1355, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1359 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1335, 22, 1359, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_output_0", "outputIndexes": [ 1360 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1358, 1360 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.12/self_attn/Concat_3_output_0", "outputIndexes": [ 1361 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5224", "outputIndexes": [ 1362 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5227", "outputIndexes": [ 1363 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1362, 1363, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5230", "outputIndexes": [ 1364 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1364 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5231", "outputIndexes": [ 1365 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1365 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5232", "outputIndexes": [ 1366 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1366, 1365 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5233", "outputIndexes": [ 1367 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1367, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_3_output_0", "outputIndexes": [ 1368 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1361, 1368 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_1_output_0", "outputIndexes": [ 1369 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1342, 1369 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Add_output_0", "outputIndexes": [ 1370 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4193 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1458367310, 2097174, 524288, 0, 0 ] } , "name": "/layers.12/self_attn/k_proj/Linear", "outputIndexes": [ 4198 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4198 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4199 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4199 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1371 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1322, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1372 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1330, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1373 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1372, 1373, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.12/self_attn/Concat_1_output_0", "outputIndexes": [ 1374 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1371, 1374 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/self_attn/Reshape_1_output_0", "outputIndexes": [ 1375 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1375 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1460988772, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.12/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1377 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1377, 1341 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_2_output_0", "outputIndexes": [ 1378 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1377 ] , "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_3_output_0", "outputIndexes": [ 1379 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1379 ] , "main_type": "NONE", "name": "Shape5195", "outputIndexes": [ 1380 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1379 ] , "main_type": "NONE", "name": "Rank5197", "outputIndexes": [ 1381 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1381, 1381 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5199", "outputIndexes": [ 1382 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1382 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5200", "outputIndexes": [ 1383 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1382, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5202", "outputIndexes": [ 1384 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1384 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5203", "outputIndexes": [ 1385 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1380, 1383, 1385, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5206", "outputIndexes": [ 1386 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1386 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5207", "outputIndexes": [ 1387 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1387 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5208", "outputIndexes": [ 1388 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1388, 1387 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5209", "outputIndexes": [ 1389 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1379, 1389, 1382 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_5_output_0", "outputIndexes": [ 1390 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1390, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Div_1_output_0", "outputIndexes": [ 1391 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1391, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1392 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1377, 1392, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_3_output_0", "outputIndexes": [ 1393 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1393 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.12/self_attn/Neg_1_output_0", "outputIndexes": [ 1394 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1391, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1395 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1377, 22, 1395, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_2_output_0", "outputIndexes": [ 1396 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1394, 1396 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.12/self_attn/Concat_4_output_0", "outputIndexes": [ 1397 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1397, 1368 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_3_output_0", "outputIndexes": [ 1398 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1378, 1398 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Add_1_output_0", "outputIndexes": [ 1399 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4193 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1460989796, 2097174, 524288, 0, 0 ] } , "name": "/layers.12/self_attn/v_proj/Linear", "outputIndexes": [ 4202 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4202 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4203 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4203 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1400 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1322, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1401 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1330, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1402 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1401, 1402, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.12/self_attn/Concat_2_output_0", "outputIndexes": [ 1403 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1400, 1403 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/self_attn/Reshape_2_output_0", "outputIndexes": [ 1404 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1370, 1399, 1404, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.12/self_attn/Reshape_7_output_0", "outputIndexes": [ 1405 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1405 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4204 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4204 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4205 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4205 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1463611258, 8388630, 2097152, 0, 0 ] } , "name": "/layers.12/self_attn/o_proj/Linear", "outputIndexes": [ 4206 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4206 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4207 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4207 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1406 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1309, 1406 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/Add_output_0", "outputIndexes": [ 1407 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1407 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1474097040, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.12/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1408 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1408 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4208 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4208 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4209 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4209 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1474129808, 25165846, 6291456, 0, 0 ] } , "name": "/layers.12/mlp/gate_proj/Linear", "outputIndexes": [ 4210 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4210 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4211 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4211 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1409 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1409 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.12/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1410 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4209 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1505587110, 25165846, 6291456, 0, 0 ] } , "name": "/layers.12/mlp/up_proj/Linear", "outputIndexes": [ 4214 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4214 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4215 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4215 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1411 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1410, 1411 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/mlp/Mul_output_0", "outputIndexes": [ 1412 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1412 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4216 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4216 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4217 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4217 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1537044412, 25165846, 6291456, 0, 0 ] } , "name": "/layers.12/mlp/down_proj/Linear", "outputIndexes": [ 4218 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4218 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4219 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4219 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1413 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1407, 1413 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/Add_1_output_0", "outputIndexes": [ 1414 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1414, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/Reshape_output_0", "outputIndexes": [ 1415 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1415 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1568501714, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.13/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1416 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1416 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4220 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4220 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4221 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4221 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1568534482, 8388630, 2097152, 0, 0 ] } , "name": "/layers.13/self_attn/q_proj/Linear", "outputIndexes": [ 4222 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4222 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4223 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4223 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1417 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1416 ] , "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_output_0", "outputIndexes": [ 1418 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1418 ] , "main_type": "NONE", "name": "Shape5554", "outputIndexes": [ 1419 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1418 ] , "main_type": "NONE", "name": "Rank5556", "outputIndexes": [ 1420 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1420, 1420 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5558", "outputIndexes": [ 1421 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1421 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5559", "outputIndexes": [ 1422 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1421, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5561", "outputIndexes": [ 1423 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1423 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5562", "outputIndexes": [ 1424 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1419, 1422, 1424, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5565", "outputIndexes": [ 1425 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1425 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5566", "outputIndexes": [ 1426 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1426, 1426 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5568", "outputIndexes": [ 1427 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1418, 1427, 1421 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_output_0", "outputIndexes": [ 1428 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1428, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1429 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1421 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5576", "outputIndexes": [ 1430 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1423 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5579", "outputIndexes": [ 1431 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1419, 1430, 1431, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5582", "outputIndexes": [ 1432 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1432 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5583", "outputIndexes": [ 1433 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1433 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5584", "outputIndexes": [ 1434 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1434, 1433 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5585", "outputIndexes": [ 1435 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1418, 1435, 1421 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_1_output_0", "outputIndexes": [ 1436 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1436, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1437 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1429, 1437, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.13/self_attn/Concat_output_0", "outputIndexes": [ 1438 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1417, 1438 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/self_attn/Reshape_output_0", "outputIndexes": [ 1439 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1439 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1579020264, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.13/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1441 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5603", "outputIndexes": [ 1442 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5606", "outputIndexes": [ 1443 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1442, 1443, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5609", "outputIndexes": [ 1444 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1444 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5610", "outputIndexes": [ 1445 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1445, 1445 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5612", "outputIndexes": [ 1446 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1446, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_2_output_0", "outputIndexes": [ 1447 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1441, 1447 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_output_0", "outputIndexes": [ 1448 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1441 ] , "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_2_output_0", "outputIndexes": [ 1449 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1449 ] , "main_type": "NONE", "name": "Shape5736", "outputIndexes": [ 1450 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1449 ] , "main_type": "NONE", "name": "Rank5738", "outputIndexes": [ 1451 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1451, 1451 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5740", "outputIndexes": [ 1452 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1452 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5741", "outputIndexes": [ 1453 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1452, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5743", "outputIndexes": [ 1454 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1454 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5744", "outputIndexes": [ 1455 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1450, 1453, 1455, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5747", "outputIndexes": [ 1456 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1456 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5748", "outputIndexes": [ 1457 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1457 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5749", "outputIndexes": [ 1458 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1458, 1457 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5750", "outputIndexes": [ 1459 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1449, 1459, 1452 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_4_output_0", "outputIndexes": [ 1460 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1460, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Div_output_0", "outputIndexes": [ 1461 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1461, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1462 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1441, 1462, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_1_output_0", "outputIndexes": [ 1463 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1463 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.13/self_attn/Neg_output_0", "outputIndexes": [ 1464 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1461, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1465 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1441, 22, 1465, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_output_0", "outputIndexes": [ 1466 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1464, 1466 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.13/self_attn/Concat_3_output_0", "outputIndexes": [ 1467 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5645", "outputIndexes": [ 1468 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5648", "outputIndexes": [ 1469 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1468, 1469, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5651", "outputIndexes": [ 1470 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1470 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5652", "outputIndexes": [ 1471 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1471 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5653", "outputIndexes": [ 1472 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1472, 1471 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5654", "outputIndexes": [ 1473 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1473, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_3_output_0", "outputIndexes": [ 1474 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1467, 1474 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_1_output_0", "outputIndexes": [ 1475 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1448, 1475 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Add_output_0", "outputIndexes": [ 1476 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4221 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1579021288, 2097174, 524288, 0, 0 ] } , "name": "/layers.13/self_attn/k_proj/Linear", "outputIndexes": [ 4226 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4226 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4227 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4227 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1477 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1428, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1478 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1436, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1479 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1478, 1479, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.13/self_attn/Concat_1_output_0", "outputIndexes": [ 1480 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1477, 1480 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/self_attn/Reshape_1_output_0", "outputIndexes": [ 1481 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1481 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1581642750, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.13/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1483 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1483, 1447 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_2_output_0", "outputIndexes": [ 1484 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1483 ] , "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_3_output_0", "outputIndexes": [ 1485 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1485 ] , "main_type": "NONE", "name": "Shape5616", "outputIndexes": [ 1486 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1485 ] , "main_type": "NONE", "name": "Rank5618", "outputIndexes": [ 1487 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1487, 1487 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5620", "outputIndexes": [ 1488 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1488 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5621", "outputIndexes": [ 1489 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1488, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5623", "outputIndexes": [ 1490 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1490 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5624", "outputIndexes": [ 1491 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1486, 1489, 1491, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5627", "outputIndexes": [ 1492 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1492 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5628", "outputIndexes": [ 1493 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1493 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5629", "outputIndexes": [ 1494 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1494, 1493 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5630", "outputIndexes": [ 1495 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1485, 1495, 1488 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_5_output_0", "outputIndexes": [ 1496 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1496, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Div_1_output_0", "outputIndexes": [ 1497 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1497, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1498 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1483, 1498, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_3_output_0", "outputIndexes": [ 1499 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1499 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.13/self_attn/Neg_1_output_0", "outputIndexes": [ 1500 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1497, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1501 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1483, 22, 1501, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_2_output_0", "outputIndexes": [ 1502 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1500, 1502 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.13/self_attn/Concat_4_output_0", "outputIndexes": [ 1503 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1503, 1474 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_3_output_0", "outputIndexes": [ 1504 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1484, 1504 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Add_1_output_0", "outputIndexes": [ 1505 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4221 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1581643774, 2097174, 524288, 0, 0 ] } , "name": "/layers.13/self_attn/v_proj/Linear", "outputIndexes": [ 4230 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4230 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4231 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4231 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1506 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1428, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1507 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1436, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1508 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1507, 1508, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.13/self_attn/Concat_2_output_0", "outputIndexes": [ 1509 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1506, 1509 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/self_attn/Reshape_2_output_0", "outputIndexes": [ 1510 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1476, 1505, 1510, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.13/self_attn/Reshape_7_output_0", "outputIndexes": [ 1511 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1511 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4232 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4232 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4233 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4233 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1584265236, 8388630, 2097152, 0, 0 ] } , "name": "/layers.13/self_attn/o_proj/Linear", "outputIndexes": [ 4234 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4234 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4235 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4235 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1512 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1415, 1512 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/Add_output_0", "outputIndexes": [ 1513 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1513 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1594751018, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.13/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1514 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1514 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4236 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4236 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4237 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4237 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1594783786, 25165846, 6291456, 0, 0 ] } , "name": "/layers.13/mlp/gate_proj/Linear", "outputIndexes": [ 4238 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4238 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4239 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4239 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1515 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1515 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.13/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1516 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4237 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1626241088, 25165846, 6291456, 0, 0 ] } , "name": "/layers.13/mlp/up_proj/Linear", "outputIndexes": [ 4242 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4242 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4243 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4243 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1517 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1516, 1517 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/mlp/Mul_output_0", "outputIndexes": [ 1518 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1518 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4244 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4244 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4245 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4245 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1657698390, 25165846, 6291456, 0, 0 ] } , "name": "/layers.13/mlp/down_proj/Linear", "outputIndexes": [ 4246 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4246 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4247 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4247 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1519 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1513, 1519 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/Add_1_output_0", "outputIndexes": [ 1520 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1520, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/Reshape_output_0", "outputIndexes": [ 1521 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1521 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1689155692, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.14/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1522 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1522 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4248 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4248 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4249 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4249 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1689188460, 8388630, 2097152, 0, 0 ] } , "name": "/layers.14/self_attn/q_proj/Linear", "outputIndexes": [ 4250 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4250 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4251 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4251 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1523 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1522 ] , "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_output_0", "outputIndexes": [ 1524 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1524 ] , "main_type": "NONE", "name": "Shape5975", "outputIndexes": [ 1525 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1524 ] , "main_type": "NONE", "name": "Rank5977", "outputIndexes": [ 1526 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1526, 1526 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5979", "outputIndexes": [ 1527 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1527 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5980", "outputIndexes": [ 1528 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1527, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5982", "outputIndexes": [ 1529 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1529 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5983", "outputIndexes": [ 1530 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1525, 1528, 1530, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5986", "outputIndexes": [ 1531 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1531 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5987", "outputIndexes": [ 1532 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1532, 1532 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5989", "outputIndexes": [ 1533 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1524, 1533, 1527 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_output_0", "outputIndexes": [ 1534 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1534, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1535 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1527 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5997", "outputIndexes": [ 1536 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1529 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6000", "outputIndexes": [ 1537 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1525, 1536, 1537, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6003", "outputIndexes": [ 1538 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1538 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6004", "outputIndexes": [ 1539 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1539 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6005", "outputIndexes": [ 1540 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1540, 1539 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6006", "outputIndexes": [ 1541 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1524, 1541, 1527 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_1_output_0", "outputIndexes": [ 1542 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1542, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1543 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1535, 1543, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.14/self_attn/Concat_output_0", "outputIndexes": [ 1544 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1523, 1544 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/self_attn/Reshape_output_0", "outputIndexes": [ 1545 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1545 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1699674242, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.14/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1547 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6024", "outputIndexes": [ 1548 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6027", "outputIndexes": [ 1549 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1548, 1549, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6030", "outputIndexes": [ 1550 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1550 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6031", "outputIndexes": [ 1551 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1551, 1551 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6033", "outputIndexes": [ 1552 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1552, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_2_output_0", "outputIndexes": [ 1553 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1547, 1553 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_output_0", "outputIndexes": [ 1554 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1547 ] , "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_2_output_0", "outputIndexes": [ 1555 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1555 ] , "main_type": "NONE", "name": "Shape6157", "outputIndexes": [ 1556 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1555 ] , "main_type": "NONE", "name": "Rank6159", "outputIndexes": [ 1557 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1557, 1557 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6161", "outputIndexes": [ 1558 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1558 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6162", "outputIndexes": [ 1559 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1558, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6164", "outputIndexes": [ 1560 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1560 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6165", "outputIndexes": [ 1561 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1556, 1559, 1561, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6168", "outputIndexes": [ 1562 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1562 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6169", "outputIndexes": [ 1563 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1563 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6170", "outputIndexes": [ 1564 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1564, 1563 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6171", "outputIndexes": [ 1565 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1555, 1565, 1558 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_4_output_0", "outputIndexes": [ 1566 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1566, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Div_output_0", "outputIndexes": [ 1567 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1567, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1568 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1547, 1568, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_1_output_0", "outputIndexes": [ 1569 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1569 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.14/self_attn/Neg_output_0", "outputIndexes": [ 1570 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1567, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1571 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1547, 22, 1571, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_output_0", "outputIndexes": [ 1572 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1570, 1572 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.14/self_attn/Concat_3_output_0", "outputIndexes": [ 1573 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6066", "outputIndexes": [ 1574 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6069", "outputIndexes": [ 1575 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1574, 1575, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6072", "outputIndexes": [ 1576 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1576 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6073", "outputIndexes": [ 1577 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1577 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6074", "outputIndexes": [ 1578 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1578, 1577 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6075", "outputIndexes": [ 1579 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1579, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_3_output_0", "outputIndexes": [ 1580 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1573, 1580 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_1_output_0", "outputIndexes": [ 1581 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1554, 1581 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Add_output_0", "outputIndexes": [ 1582 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4249 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1699675266, 2097174, 524288, 0, 0 ] } , "name": "/layers.14/self_attn/k_proj/Linear", "outputIndexes": [ 4254 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4254 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4255 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4255 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1583 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1534, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1584 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1542, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1585 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1584, 1585, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.14/self_attn/Concat_1_output_0", "outputIndexes": [ 1586 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1583, 1586 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/self_attn/Reshape_1_output_0", "outputIndexes": [ 1587 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1587 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1702296728, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.14/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1589 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1589, 1553 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_2_output_0", "outputIndexes": [ 1590 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1589 ] , "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_3_output_0", "outputIndexes": [ 1591 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1591 ] , "main_type": "NONE", "name": "Shape6037", "outputIndexes": [ 1592 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1591 ] , "main_type": "NONE", "name": "Rank6039", "outputIndexes": [ 1593 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1593, 1593 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6041", "outputIndexes": [ 1594 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1594 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6042", "outputIndexes": [ 1595 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1594, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6044", "outputIndexes": [ 1596 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1596 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6045", "outputIndexes": [ 1597 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1592, 1595, 1597, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6048", "outputIndexes": [ 1598 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1598 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6049", "outputIndexes": [ 1599 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1599 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6050", "outputIndexes": [ 1600 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1600, 1599 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6051", "outputIndexes": [ 1601 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1591, 1601, 1594 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_5_output_0", "outputIndexes": [ 1602 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1602, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Div_1_output_0", "outputIndexes": [ 1603 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1603, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1604 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1589, 1604, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_3_output_0", "outputIndexes": [ 1605 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1605 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.14/self_attn/Neg_1_output_0", "outputIndexes": [ 1606 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1603, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1607 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1589, 22, 1607, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_2_output_0", "outputIndexes": [ 1608 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1606, 1608 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.14/self_attn/Concat_4_output_0", "outputIndexes": [ 1609 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1609, 1580 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_3_output_0", "outputIndexes": [ 1610 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1590, 1610 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Add_1_output_0", "outputIndexes": [ 1611 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4249 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1702297752, 2097174, 524288, 0, 0 ] } , "name": "/layers.14/self_attn/v_proj/Linear", "outputIndexes": [ 4258 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4258 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4259 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4259 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1612 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1534, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1613 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1542, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1614 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1613, 1614, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.14/self_attn/Concat_2_output_0", "outputIndexes": [ 1615 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1612, 1615 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/self_attn/Reshape_2_output_0", "outputIndexes": [ 1616 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1582, 1611, 1616, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.14/self_attn/Reshape_7_output_0", "outputIndexes": [ 1617 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1617 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4260 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4260 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4261 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4261 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1704919214, 8388630, 2097152, 0, 0 ] } , "name": "/layers.14/self_attn/o_proj/Linear", "outputIndexes": [ 4262 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4262 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4263 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4263 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1618 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1521, 1618 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/Add_output_0", "outputIndexes": [ 1619 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1619 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1715404996, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.14/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1620 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1620 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4264 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4264 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4265 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4265 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1715437764, 25165846, 6291456, 0, 0 ] } , "name": "/layers.14/mlp/gate_proj/Linear", "outputIndexes": [ 4266 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4266 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4267 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4267 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1621 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1621 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.14/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1622 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4265 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1746895066, 25165846, 6291456, 0, 0 ] } , "name": "/layers.14/mlp/up_proj/Linear", "outputIndexes": [ 4270 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4270 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4271 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4271 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1623 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1622, 1623 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/mlp/Mul_output_0", "outputIndexes": [ 1624 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1624 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4272 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4272 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4273 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4273 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1778352368, 25165846, 6291456, 0, 0 ] } , "name": "/layers.14/mlp/down_proj/Linear", "outputIndexes": [ 4274 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4274 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4275 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4275 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1625 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1619, 1625 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/Add_1_output_0", "outputIndexes": [ 1626 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1626, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/Reshape_output_0", "outputIndexes": [ 1627 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1627 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1809809670, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.15/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1628 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1628 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4276 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4276 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4277 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4277 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1809842438, 8388630, 2097152, 0, 0 ] } , "name": "/layers.15/self_attn/q_proj/Linear", "outputIndexes": [ 4278 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4278 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4279 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4279 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1629 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1628 ] , "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_output_0", "outputIndexes": [ 1630 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1630 ] , "main_type": "NONE", "name": "Shape6396", "outputIndexes": [ 1631 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1630 ] , "main_type": "NONE", "name": "Rank6398", "outputIndexes": [ 1632 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1632, 1632 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6400", "outputIndexes": [ 1633 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1633 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6401", "outputIndexes": [ 1634 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1633, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6403", "outputIndexes": [ 1635 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1635 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6404", "outputIndexes": [ 1636 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1631, 1634, 1636, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6407", "outputIndexes": [ 1637 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1637 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6408", "outputIndexes": [ 1638 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1638, 1638 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6410", "outputIndexes": [ 1639 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1630, 1639, 1633 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_output_0", "outputIndexes": [ 1640 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1640, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1641 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1633 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6418", "outputIndexes": [ 1642 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1635 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6421", "outputIndexes": [ 1643 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1631, 1642, 1643, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6424", "outputIndexes": [ 1644 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1644 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6425", "outputIndexes": [ 1645 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1645 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6426", "outputIndexes": [ 1646 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1646, 1645 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6427", "outputIndexes": [ 1647 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1630, 1647, 1633 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_1_output_0", "outputIndexes": [ 1648 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1649 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1641, 1649, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.15/self_attn/Concat_output_0", "outputIndexes": [ 1650 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1629, 1650 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/self_attn/Reshape_output_0", "outputIndexes": [ 1651 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1651 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1820328220, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.15/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1653 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6445", "outputIndexes": [ 1654 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6448", "outputIndexes": [ 1655 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1654, 1655, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6451", "outputIndexes": [ 1656 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1656 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6452", "outputIndexes": [ 1657 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1657, 1657 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6454", "outputIndexes": [ 1658 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1658, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_2_output_0", "outputIndexes": [ 1659 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653, 1659 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_output_0", "outputIndexes": [ 1660 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653 ] , "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_2_output_0", "outputIndexes": [ 1661 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1661 ] , "main_type": "NONE", "name": "Shape6578", "outputIndexes": [ 1662 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1661 ] , "main_type": "NONE", "name": "Rank6580", "outputIndexes": [ 1663 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1663, 1663 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6582", "outputIndexes": [ 1664 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1664 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6583", "outputIndexes": [ 1665 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1664, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6585", "outputIndexes": [ 1666 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1666 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6586", "outputIndexes": [ 1667 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1662, 1665, 1667, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6589", "outputIndexes": [ 1668 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1668 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6590", "outputIndexes": [ 1669 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1669 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6591", "outputIndexes": [ 1670 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1670, 1669 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6592", "outputIndexes": [ 1671 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1661, 1671, 1664 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_4_output_0", "outputIndexes": [ 1672 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1672, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Div_output_0", "outputIndexes": [ 1673 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1673, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1674 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653, 1674, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_1_output_0", "outputIndexes": [ 1675 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1675 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.15/self_attn/Neg_output_0", "outputIndexes": [ 1676 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1673, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1677 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653, 22, 1677, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_output_0", "outputIndexes": [ 1678 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1676, 1678 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.15/self_attn/Concat_3_output_0", "outputIndexes": [ 1679 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6487", "outputIndexes": [ 1680 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6490", "outputIndexes": [ 1681 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1680, 1681, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6493", "outputIndexes": [ 1682 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1682 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6494", "outputIndexes": [ 1683 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1683 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6495", "outputIndexes": [ 1684 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1684, 1683 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6496", "outputIndexes": [ 1685 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1685, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_3_output_0", "outputIndexes": [ 1686 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1679, 1686 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_1_output_0", "outputIndexes": [ 1687 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1660, 1687 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Add_output_0", "outputIndexes": [ 1688 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4277 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1820329244, 2097174, 524288, 0, 0 ] } , "name": "/layers.15/self_attn/k_proj/Linear", "outputIndexes": [ 4282 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4282 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4283 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4283 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1689 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1640, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1690 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1691 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1690, 1691, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.15/self_attn/Concat_1_output_0", "outputIndexes": [ 1692 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1689, 1692 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/self_attn/Reshape_1_output_0", "outputIndexes": [ 1693 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1693 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1822950706, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.15/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1695 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1695, 1659 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_2_output_0", "outputIndexes": [ 1696 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1695 ] , "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_3_output_0", "outputIndexes": [ 1697 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1697 ] , "main_type": "NONE", "name": "Shape6458", "outputIndexes": [ 1698 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1697 ] , "main_type": "NONE", "name": "Rank6460", "outputIndexes": [ 1699 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1699, 1699 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6462", "outputIndexes": [ 1700 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1700 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6463", "outputIndexes": [ 1701 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1700, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6465", "outputIndexes": [ 1702 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1702 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6466", "outputIndexes": [ 1703 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1698, 1701, 1703, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6469", "outputIndexes": [ 1704 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1704 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6470", "outputIndexes": [ 1705 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1705 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6471", "outputIndexes": [ 1706 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1706, 1705 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6472", "outputIndexes": [ 1707 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1697, 1707, 1700 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_5_output_0", "outputIndexes": [ 1708 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1708, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Div_1_output_0", "outputIndexes": [ 1709 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1709, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1710 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1695, 1710, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_3_output_0", "outputIndexes": [ 1711 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1711 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.15/self_attn/Neg_1_output_0", "outputIndexes": [ 1712 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1709, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1713 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1695, 22, 1713, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_2_output_0", "outputIndexes": [ 1714 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1712, 1714 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.15/self_attn/Concat_4_output_0", "outputIndexes": [ 1715 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1715, 1686 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_3_output_0", "outputIndexes": [ 1716 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1696, 1716 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Add_1_output_0", "outputIndexes": [ 1717 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4277 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1822951730, 2097174, 524288, 0, 0 ] } , "name": "/layers.15/self_attn/v_proj/Linear", "outputIndexes": [ 4286 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4286 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4287 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4287 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1718 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1640, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1719 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1720 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1719, 1720, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.15/self_attn/Concat_2_output_0", "outputIndexes": [ 1721 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1718, 1721 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/self_attn/Reshape_2_output_0", "outputIndexes": [ 1722 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1688, 1717, 1722, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.15/self_attn/Reshape_7_output_0", "outputIndexes": [ 1723 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1723 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4288 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4288 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4289 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4289 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1825573192, 8388630, 2097152, 0, 0 ] } , "name": "/layers.15/self_attn/o_proj/Linear", "outputIndexes": [ 4290 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4290 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4291 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4291 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1724 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1627, 1724 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/Add_output_0", "outputIndexes": [ 1725 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1725 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1836058974, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.15/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1726 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1726 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4292 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4292 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4293 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4293 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1836091742, 25165846, 6291456, 0, 0 ] } , "name": "/layers.15/mlp/gate_proj/Linear", "outputIndexes": [ 4294 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4294 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4295 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4295 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1727 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1727 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.15/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1728 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4293 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1867549044, 25165846, 6291456, 0, 0 ] } , "name": "/layers.15/mlp/up_proj/Linear", "outputIndexes": [ 4298 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4298 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4299 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4299 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1729 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1728, 1729 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/mlp/Mul_output_0", "outputIndexes": [ 1730 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1730 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4300 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4300 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4301 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4301 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1899006346, 25165846, 6291456, 0, 0 ] } , "name": "/layers.15/mlp/down_proj/Linear", "outputIndexes": [ 4302 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4302 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4303 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4303 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1731 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1725, 1731 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/Add_1_output_0", "outputIndexes": [ 1732 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1732, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/Reshape_output_0", "outputIndexes": [ 1733 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1733 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1930463648, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.16/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1734 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1734 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4304 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4304 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4305 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4305 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1930496416, 8388630, 2097152, 0, 0 ] } , "name": "/layers.16/self_attn/q_proj/Linear", "outputIndexes": [ 4306 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4306 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4307 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4307 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1735 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1734 ] , "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_output_0", "outputIndexes": [ 1736 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1736 ] , "main_type": "NONE", "name": "Shape6817", "outputIndexes": [ 1737 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1736 ] , "main_type": "NONE", "name": "Rank6819", "outputIndexes": [ 1738 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1738, 1738 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6821", "outputIndexes": [ 1739 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1739 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6822", "outputIndexes": [ 1740 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1739, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6824", "outputIndexes": [ 1741 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6825", "outputIndexes": [ 1742 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1737, 1740, 1742, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6828", "outputIndexes": [ 1743 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1743 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6829", "outputIndexes": [ 1744 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1744, 1744 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6831", "outputIndexes": [ 1745 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1736, 1745, 1739 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_output_0", "outputIndexes": [ 1746 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1746, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1747 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1739 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6839", "outputIndexes": [ 1748 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6842", "outputIndexes": [ 1749 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1737, 1748, 1749, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6845", "outputIndexes": [ 1750 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1750 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6846", "outputIndexes": [ 1751 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1751 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6847", "outputIndexes": [ 1752 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1752, 1751 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6848", "outputIndexes": [ 1753 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1736, 1753, 1739 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_1_output_0", "outputIndexes": [ 1754 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1754, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1755 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1747, 1755, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.16/self_attn/Concat_output_0", "outputIndexes": [ 1756 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1735, 1756 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/self_attn/Reshape_output_0", "outputIndexes": [ 1757 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1757 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1940982198, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.16/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1759 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6866", "outputIndexes": [ 1760 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6869", "outputIndexes": [ 1761 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1760, 1761, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6872", "outputIndexes": [ 1762 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1762 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6873", "outputIndexes": [ 1763 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1763, 1763 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6875", "outputIndexes": [ 1764 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1764, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_2_output_0", "outputIndexes": [ 1765 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1759, 1765 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_output_0", "outputIndexes": [ 1766 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1759 ] , "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_2_output_0", "outputIndexes": [ 1767 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1767 ] , "main_type": "NONE", "name": "Shape6999", "outputIndexes": [ 1768 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1767 ] , "main_type": "NONE", "name": "Rank7001", "outputIndexes": [ 1769 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1769, 1769 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7003", "outputIndexes": [ 1770 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1770 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7004", "outputIndexes": [ 1771 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1770, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7006", "outputIndexes": [ 1772 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1772 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7007", "outputIndexes": [ 1773 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1768, 1771, 1773, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7010", "outputIndexes": [ 1774 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1774 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7011", "outputIndexes": [ 1775 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1775 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7012", "outputIndexes": [ 1776 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1776, 1775 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7013", "outputIndexes": [ 1777 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1767, 1777, 1770 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_4_output_0", "outputIndexes": [ 1778 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1778, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Div_output_0", "outputIndexes": [ 1779 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1779, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1780 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1759, 1780, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_1_output_0", "outputIndexes": [ 1781 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1781 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.16/self_attn/Neg_output_0", "outputIndexes": [ 1782 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1779, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1783 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1759, 22, 1783, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_output_0", "outputIndexes": [ 1784 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1782, 1784 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.16/self_attn/Concat_3_output_0", "outputIndexes": [ 1785 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6908", "outputIndexes": [ 1786 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6911", "outputIndexes": [ 1787 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1786, 1787, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6914", "outputIndexes": [ 1788 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1788 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6915", "outputIndexes": [ 1789 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1789 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6916", "outputIndexes": [ 1790 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1790, 1789 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6917", "outputIndexes": [ 1791 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1791, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_3_output_0", "outputIndexes": [ 1792 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1785, 1792 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_1_output_0", "outputIndexes": [ 1793 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1766, 1793 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Add_output_0", "outputIndexes": [ 1794 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4305 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1940983222, 2097174, 524288, 0, 0 ] } , "name": "/layers.16/self_attn/k_proj/Linear", "outputIndexes": [ 4310 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4310 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4311 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4311 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1795 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1746, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1796 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1754, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1797 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1796, 1797, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.16/self_attn/Concat_1_output_0", "outputIndexes": [ 1798 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1795, 1798 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/self_attn/Reshape_1_output_0", "outputIndexes": [ 1799 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1799 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1943604684, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.16/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1801 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1801, 1765 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_2_output_0", "outputIndexes": [ 1802 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1801 ] , "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_3_output_0", "outputIndexes": [ 1803 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1803 ] , "main_type": "NONE", "name": "Shape6879", "outputIndexes": [ 1804 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1803 ] , "main_type": "NONE", "name": "Rank6881", "outputIndexes": [ 1805 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1805, 1805 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6883", "outputIndexes": [ 1806 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1806 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6884", "outputIndexes": [ 1807 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1806, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6886", "outputIndexes": [ 1808 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1808 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6887", "outputIndexes": [ 1809 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1804, 1807, 1809, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6890", "outputIndexes": [ 1810 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1810 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6891", "outputIndexes": [ 1811 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1811 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6892", "outputIndexes": [ 1812 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1812, 1811 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6893", "outputIndexes": [ 1813 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1803, 1813, 1806 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_5_output_0", "outputIndexes": [ 1814 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1814, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Div_1_output_0", "outputIndexes": [ 1815 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1815, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1816 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1801, 1816, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_3_output_0", "outputIndexes": [ 1817 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1817 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.16/self_attn/Neg_1_output_0", "outputIndexes": [ 1818 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1815, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1819 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1801, 22, 1819, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_2_output_0", "outputIndexes": [ 1820 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1818, 1820 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.16/self_attn/Concat_4_output_0", "outputIndexes": [ 1821 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1821, 1792 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_3_output_0", "outputIndexes": [ 1822 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1802, 1822 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Add_1_output_0", "outputIndexes": [ 1823 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4305 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1943605708, 2097174, 524288, 0, 0 ] } , "name": "/layers.16/self_attn/v_proj/Linear", "outputIndexes": [ 4314 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4314 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4315 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4315 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1824 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1746, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1825 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1754, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1826 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1825, 1826, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.16/self_attn/Concat_2_output_0", "outputIndexes": [ 1827 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1824, 1827 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/self_attn/Reshape_2_output_0", "outputIndexes": [ 1828 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1794, 1823, 1828, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.16/self_attn/Reshape_7_output_0", "outputIndexes": [ 1829 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1829 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4316 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4316 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4317 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4317 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1946227170, 8388630, 2097152, 0, 0 ] } , "name": "/layers.16/self_attn/o_proj/Linear", "outputIndexes": [ 4318 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4318 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4319 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4319 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1830 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1733, 1830 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/Add_output_0", "outputIndexes": [ 1831 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1831 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1956712952, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.16/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1832 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1832 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4320 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4320 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4321 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4321 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1956745720, 25165846, 6291456, 0, 0 ] } , "name": "/layers.16/mlp/gate_proj/Linear", "outputIndexes": [ 4322 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4322 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4323 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4323 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1833 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1833 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.16/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1834 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4321 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1988203022, 25165846, 6291456, 0, 0 ] } , "name": "/layers.16/mlp/up_proj/Linear", "outputIndexes": [ 4326 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4326 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4327 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4327 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1835 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834, 1835 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/mlp/Mul_output_0", "outputIndexes": [ 1836 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1836 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4328 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4328 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4329 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4329 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2019660324, 25165846, 6291456, 0, 0 ] } , "name": "/layers.16/mlp/down_proj/Linear", "outputIndexes": [ 4330 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4330 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4331 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4331 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1837 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1831, 1837 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/Add_1_output_0", "outputIndexes": [ 1838 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1838, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/Reshape_output_0", "outputIndexes": [ 1839 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2051117626, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.17/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1840 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1840 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4332 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4332 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4333 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4333 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2051150394, 8388630, 2097152, 0, 0 ] } , "name": "/layers.17/self_attn/q_proj/Linear", "outputIndexes": [ 4334 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4334 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4335 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4335 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1841 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1840 ] , "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_output_0", "outputIndexes": [ 1842 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1842 ] , "main_type": "NONE", "name": "Shape7238", "outputIndexes": [ 1843 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1842 ] , "main_type": "NONE", "name": "Rank7240", "outputIndexes": [ 1844 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1844, 1844 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7242", "outputIndexes": [ 1845 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1845 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7243", "outputIndexes": [ 1846 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1845, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7245", "outputIndexes": [ 1847 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1847 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7246", "outputIndexes": [ 1848 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1843, 1846, 1848, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7249", "outputIndexes": [ 1849 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1849 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7250", "outputIndexes": [ 1850 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1850, 1850 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7252", "outputIndexes": [ 1851 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1842, 1851, 1845 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_output_0", "outputIndexes": [ 1852 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1852, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1853 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1845 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7260", "outputIndexes": [ 1854 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1847 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7263", "outputIndexes": [ 1855 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1843, 1854, 1855, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7266", "outputIndexes": [ 1856 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1856 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7267", "outputIndexes": [ 1857 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1857 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7268", "outputIndexes": [ 1858 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1858, 1857 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7269", "outputIndexes": [ 1859 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1842, 1859, 1845 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_1_output_0", "outputIndexes": [ 1860 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1860, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1861 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1853, 1861, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.17/self_attn/Concat_output_0", "outputIndexes": [ 1862 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1841, 1862 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/self_attn/Reshape_output_0", "outputIndexes": [ 1863 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1863 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2061636176, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.17/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1865 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7287", "outputIndexes": [ 1866 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7290", "outputIndexes": [ 1867 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1866, 1867, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7293", "outputIndexes": [ 1868 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1868 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7294", "outputIndexes": [ 1869 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1869, 1869 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7296", "outputIndexes": [ 1870 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1870, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_2_output_0", "outputIndexes": [ 1871 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1865, 1871 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_output_0", "outputIndexes": [ 1872 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1865 ] , "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_2_output_0", "outputIndexes": [ 1873 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1873 ] , "main_type": "NONE", "name": "Shape7420", "outputIndexes": [ 1874 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1873 ] , "main_type": "NONE", "name": "Rank7422", "outputIndexes": [ 1875 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1875, 1875 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7424", "outputIndexes": [ 1876 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1876 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7425", "outputIndexes": [ 1877 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1876, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7427", "outputIndexes": [ 1878 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1878 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7428", "outputIndexes": [ 1879 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1874, 1877, 1879, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7431", "outputIndexes": [ 1880 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1880 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7432", "outputIndexes": [ 1881 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1881 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7433", "outputIndexes": [ 1882 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1882, 1881 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7434", "outputIndexes": [ 1883 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1873, 1883, 1876 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_4_output_0", "outputIndexes": [ 1884 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1884, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Div_output_0", "outputIndexes": [ 1885 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1885, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1886 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1865, 1886, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_1_output_0", "outputIndexes": [ 1887 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1887 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.17/self_attn/Neg_output_0", "outputIndexes": [ 1888 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1885, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1889 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1865, 22, 1889, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_output_0", "outputIndexes": [ 1890 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1888, 1890 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.17/self_attn/Concat_3_output_0", "outputIndexes": [ 1891 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7329", "outputIndexes": [ 1892 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7332", "outputIndexes": [ 1893 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1892, 1893, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7335", "outputIndexes": [ 1894 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1894 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7336", "outputIndexes": [ 1895 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1895 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7337", "outputIndexes": [ 1896 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1896, 1895 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7338", "outputIndexes": [ 1897 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1897, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_3_output_0", "outputIndexes": [ 1898 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1891, 1898 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_1_output_0", "outputIndexes": [ 1899 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1872, 1899 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Add_output_0", "outputIndexes": [ 1900 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4333 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2061637200, 2097174, 524288, 0, 0 ] } , "name": "/layers.17/self_attn/k_proj/Linear", "outputIndexes": [ 4338 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4338 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4339 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4339 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1901 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1852, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1902 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1860, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1903 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1902, 1903, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.17/self_attn/Concat_1_output_0", "outputIndexes": [ 1904 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1901, 1904 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/self_attn/Reshape_1_output_0", "outputIndexes": [ 1905 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1905 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2064258662, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.17/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1907 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1907, 1871 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_2_output_0", "outputIndexes": [ 1908 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1907 ] , "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_3_output_0", "outputIndexes": [ 1909 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1909 ] , "main_type": "NONE", "name": "Shape7300", "outputIndexes": [ 1910 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1909 ] , "main_type": "NONE", "name": "Rank7302", "outputIndexes": [ 1911 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1911, 1911 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7304", "outputIndexes": [ 1912 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1912 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7305", "outputIndexes": [ 1913 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1912, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7307", "outputIndexes": [ 1914 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1914 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7308", "outputIndexes": [ 1915 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1910, 1913, 1915, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7311", "outputIndexes": [ 1916 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1916 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7312", "outputIndexes": [ 1917 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1917 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7313", "outputIndexes": [ 1918 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1918, 1917 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7314", "outputIndexes": [ 1919 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1909, 1919, 1912 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_5_output_0", "outputIndexes": [ 1920 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1920, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Div_1_output_0", "outputIndexes": [ 1921 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1921, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1922 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1907, 1922, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_3_output_0", "outputIndexes": [ 1923 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1923 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.17/self_attn/Neg_1_output_0", "outputIndexes": [ 1924 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1921, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1925 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1907, 22, 1925, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_2_output_0", "outputIndexes": [ 1926 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1924, 1926 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.17/self_attn/Concat_4_output_0", "outputIndexes": [ 1927 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1927, 1898 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_3_output_0", "outputIndexes": [ 1928 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1908, 1928 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Add_1_output_0", "outputIndexes": [ 1929 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4333 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2064259686, 2097174, 524288, 0, 0 ] } , "name": "/layers.17/self_attn/v_proj/Linear", "outputIndexes": [ 4342 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4342 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4343 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4343 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1930 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1852, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1931 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1860, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1932 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1931, 1932, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.17/self_attn/Concat_2_output_0", "outputIndexes": [ 1933 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1930, 1933 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/self_attn/Reshape_2_output_0", "outputIndexes": [ 1934 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1900, 1929, 1934, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.17/self_attn/Reshape_7_output_0", "outputIndexes": [ 1935 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1935 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4344 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4344 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4345 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4345 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2066881148, 8388630, 2097152, 0, 0 ] } , "name": "/layers.17/self_attn/o_proj/Linear", "outputIndexes": [ 4346 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4346 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4347 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4347 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1936 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839, 1936 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/Add_output_0", "outputIndexes": [ 1937 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1937 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2077366930, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.17/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1938 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1938 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4348 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4348 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4349 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4349 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2077399698, 25165846, 6291456, 0, 0 ] } , "name": "/layers.17/mlp/gate_proj/Linear", "outputIndexes": [ 4350 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4350 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4351 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4351 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1939 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1939 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.17/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1940 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4349 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2108857000, 25165846, 6291456, 0, 0 ] } , "name": "/layers.17/mlp/up_proj/Linear", "outputIndexes": [ 4354 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4354 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4355 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4355 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1941 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1940, 1941 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/mlp/Mul_output_0", "outputIndexes": [ 1942 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1942 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4356 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4356 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4357 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4357 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2140314302, 25165846, 6291456, 0, 0 ] } , "name": "/layers.17/mlp/down_proj/Linear", "outputIndexes": [ 4358 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4358 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4359 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4359 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1943 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1937, 1943 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/Add_1_output_0", "outputIndexes": [ 1944 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1944, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/Reshape_output_0", "outputIndexes": [ 1945 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1945 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2171771604, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.18/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1946 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1946 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4360 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4360 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4361 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4361 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2171804372, 8388630, 2097152, 0, 0 ] } , "name": "/layers.18/self_attn/q_proj/Linear", "outputIndexes": [ 4362 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4362 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4363 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4363 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1947 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1946 ] , "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_output_0", "outputIndexes": [ 1948 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1948 ] , "main_type": "NONE", "name": "Shape7659", "outputIndexes": [ 1949 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1948 ] , "main_type": "NONE", "name": "Rank7661", "outputIndexes": [ 1950 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1950, 1950 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7663", "outputIndexes": [ 1951 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1951 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7664", "outputIndexes": [ 1952 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1951, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7666", "outputIndexes": [ 1953 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1953 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7667", "outputIndexes": [ 1954 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1949, 1952, 1954, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7670", "outputIndexes": [ 1955 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1955 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7671", "outputIndexes": [ 1956 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1956, 1956 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7673", "outputIndexes": [ 1957 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1948, 1957, 1951 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_output_0", "outputIndexes": [ 1958 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1958, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1959 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1951 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7681", "outputIndexes": [ 1960 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1953 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7684", "outputIndexes": [ 1961 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1949, 1960, 1961, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7687", "outputIndexes": [ 1962 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1962 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7688", "outputIndexes": [ 1963 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1963 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7689", "outputIndexes": [ 1964 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1964, 1963 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7690", "outputIndexes": [ 1965 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1948, 1965, 1951 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_1_output_0", "outputIndexes": [ 1966 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1967 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1959, 1967, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.18/self_attn/Concat_output_0", "outputIndexes": [ 1968 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1947, 1968 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/self_attn/Reshape_output_0", "outputIndexes": [ 1969 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1969 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2182290154, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.18/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1971 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7708", "outputIndexes": [ 1972 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7711", "outputIndexes": [ 1973 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1972, 1973, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7714", "outputIndexes": [ 1974 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1974 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7715", "outputIndexes": [ 1975 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1975, 1975 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7717", "outputIndexes": [ 1976 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 1976, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_2_output_0", "outputIndexes": [ 1977 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1971, 1977 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_output_0", "outputIndexes": [ 1978 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1971 ] , "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_2_output_0", "outputIndexes": [ 1979 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1979 ] , "main_type": "NONE", "name": "Shape7841", "outputIndexes": [ 1980 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1979 ] , "main_type": "NONE", "name": "Rank7843", "outputIndexes": [ 1981 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1981, 1981 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7845", "outputIndexes": [ 1982 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1982 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7846", "outputIndexes": [ 1983 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1982, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7848", "outputIndexes": [ 1984 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1984 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7849", "outputIndexes": [ 1985 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1980, 1983, 1985, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7852", "outputIndexes": [ 1986 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1986 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7853", "outputIndexes": [ 1987 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 1987 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7854", "outputIndexes": [ 1988 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1988, 1987 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7855", "outputIndexes": [ 1989 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1979, 1989, 1982 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_4_output_0", "outputIndexes": [ 1990 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1990, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Div_output_0", "outputIndexes": [ 1991 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1991, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1992 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1971, 1992, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_1_output_0", "outputIndexes": [ 1993 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1993 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.18/self_attn/Neg_output_0", "outputIndexes": [ 1994 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1991, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1995 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1971, 22, 1995, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_output_0", "outputIndexes": [ 1996 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1994, 1996 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.18/self_attn/Concat_3_output_0", "outputIndexes": [ 1997 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7750", "outputIndexes": [ 1998 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7753", "outputIndexes": [ 1999 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 1998, 1999, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7756", "outputIndexes": [ 2000 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2000 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7757", "outputIndexes": [ 2001 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2001 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7758", "outputIndexes": [ 2002 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2002, 2001 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7759", "outputIndexes": [ 2003 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2003, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_3_output_0", "outputIndexes": [ 2004 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1997, 2004 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_1_output_0", "outputIndexes": [ 2005 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1978, 2005 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Add_output_0", "outputIndexes": [ 2006 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4361 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2182291178, 2097174, 524288, 0, 0 ] } , "name": "/layers.18/self_attn/k_proj/Linear", "outputIndexes": [ 4366 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4366 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4367 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4367 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2007 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1958, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2008 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2009 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2008, 2009, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.18/self_attn/Concat_1_output_0", "outputIndexes": [ 2010 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2007, 2010 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/self_attn/Reshape_1_output_0", "outputIndexes": [ 2011 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2011 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2184912640, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.18/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2013 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2013, 1977 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_2_output_0", "outputIndexes": [ 2014 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2013 ] , "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_3_output_0", "outputIndexes": [ 2015 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2015 ] , "main_type": "NONE", "name": "Shape7721", "outputIndexes": [ 2016 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2015 ] , "main_type": "NONE", "name": "Rank7723", "outputIndexes": [ 2017 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2017, 2017 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7725", "outputIndexes": [ 2018 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2018 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7726", "outputIndexes": [ 2019 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2018, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7728", "outputIndexes": [ 2020 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2020 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7729", "outputIndexes": [ 2021 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2016, 2019, 2021, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7732", "outputIndexes": [ 2022 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2022 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7733", "outputIndexes": [ 2023 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2023 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7734", "outputIndexes": [ 2024 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2024, 2023 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7735", "outputIndexes": [ 2025 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2015, 2025, 2018 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_5_output_0", "outputIndexes": [ 2026 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2026, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Div_1_output_0", "outputIndexes": [ 2027 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2027, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2028 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2013, 2028, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_3_output_0", "outputIndexes": [ 2029 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2029 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.18/self_attn/Neg_1_output_0", "outputIndexes": [ 2030 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2027, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2031 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2013, 22, 2031, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_2_output_0", "outputIndexes": [ 2032 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2030, 2032 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.18/self_attn/Concat_4_output_0", "outputIndexes": [ 2033 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2033, 2004 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_3_output_0", "outputIndexes": [ 2034 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2014, 2034 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Add_1_output_0", "outputIndexes": [ 2035 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4361 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2184913664, 2097174, 524288, 0, 0 ] } , "name": "/layers.18/self_attn/v_proj/Linear", "outputIndexes": [ 4370 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4370 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4371 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4371 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2036 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1958, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2037 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2038 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2037, 2038, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.18/self_attn/Concat_2_output_0", "outputIndexes": [ 2039 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2036, 2039 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/self_attn/Reshape_2_output_0", "outputIndexes": [ 2040 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2006, 2035, 2040, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.18/self_attn/Reshape_7_output_0", "outputIndexes": [ 2041 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2041 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4372 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4372 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4373 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4373 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2187535126, 8388630, 2097152, 0, 0 ] } , "name": "/layers.18/self_attn/o_proj/Linear", "outputIndexes": [ 4374 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4374 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4375 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4375 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2042 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1945, 2042 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/Add_output_0", "outputIndexes": [ 2043 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2043 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2198020908, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.18/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2044 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2044 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4376 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4376 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4377 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4377 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2198053676, 25165846, 6291456, 0, 0 ] } , "name": "/layers.18/mlp/gate_proj/Linear", "outputIndexes": [ 4378 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4378 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4379 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4379 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2045 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2045 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.18/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2046 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4377 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2229510978, 25165846, 6291456, 0, 0 ] } , "name": "/layers.18/mlp/up_proj/Linear", "outputIndexes": [ 4382 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4382 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4383 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4383 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2047 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2046, 2047 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/mlp/Mul_output_0", "outputIndexes": [ 2048 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2048 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4384 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4384 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4385 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4385 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2260968280, 25165846, 6291456, 0, 0 ] } , "name": "/layers.18/mlp/down_proj/Linear", "outputIndexes": [ 4386 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4386 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4387 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4387 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2049 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2043, 2049 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/Add_1_output_0", "outputIndexes": [ 2050 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2050, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/Reshape_output_0", "outputIndexes": [ 2051 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2051 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2292425582, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.19/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2052 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2052 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4388 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4388 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4389 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4389 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2292458350, 8388630, 2097152, 0, 0 ] } , "name": "/layers.19/self_attn/q_proj/Linear", "outputIndexes": [ 4390 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4390 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4391 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4391 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2053 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2052 ] , "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_output_0", "outputIndexes": [ 2054 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2054 ] , "main_type": "NONE", "name": "Shape8080", "outputIndexes": [ 2055 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2054 ] , "main_type": "NONE", "name": "Rank8082", "outputIndexes": [ 2056 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2056, 2056 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8084", "outputIndexes": [ 2057 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2057 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8085", "outputIndexes": [ 2058 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2057, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8087", "outputIndexes": [ 2059 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2059 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8088", "outputIndexes": [ 2060 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2055, 2058, 2060, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8091", "outputIndexes": [ 2061 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2061 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8092", "outputIndexes": [ 2062 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2062, 2062 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8094", "outputIndexes": [ 2063 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2054, 2063, 2057 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_output_0", "outputIndexes": [ 2064 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2064, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2065 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2057 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8102", "outputIndexes": [ 2066 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2059 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8105", "outputIndexes": [ 2067 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2055, 2066, 2067, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8108", "outputIndexes": [ 2068 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2068 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8109", "outputIndexes": [ 2069 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2069 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8110", "outputIndexes": [ 2070 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2070, 2069 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8111", "outputIndexes": [ 2071 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2054, 2071, 2057 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_1_output_0", "outputIndexes": [ 2072 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2072, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2073 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2065, 2073, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.19/self_attn/Concat_output_0", "outputIndexes": [ 2074 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2053, 2074 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/self_attn/Reshape_output_0", "outputIndexes": [ 2075 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2075 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2302944132, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.19/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2077 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8129", "outputIndexes": [ 2078 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8132", "outputIndexes": [ 2079 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2078, 2079, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8135", "outputIndexes": [ 2080 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2080 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8136", "outputIndexes": [ 2081 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2081, 2081 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8138", "outputIndexes": [ 2082 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2082, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_2_output_0", "outputIndexes": [ 2083 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2077, 2083 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_output_0", "outputIndexes": [ 2084 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2077 ] , "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_2_output_0", "outputIndexes": [ 2085 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2085 ] , "main_type": "NONE", "name": "Shape8262", "outputIndexes": [ 2086 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2085 ] , "main_type": "NONE", "name": "Rank8264", "outputIndexes": [ 2087 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2087, 2087 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8266", "outputIndexes": [ 2088 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2088 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8267", "outputIndexes": [ 2089 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2088, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8269", "outputIndexes": [ 2090 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2090 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8270", "outputIndexes": [ 2091 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2086, 2089, 2091, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8273", "outputIndexes": [ 2092 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2092 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8274", "outputIndexes": [ 2093 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2093 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8275", "outputIndexes": [ 2094 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2094, 2093 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8276", "outputIndexes": [ 2095 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2085, 2095, 2088 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_4_output_0", "outputIndexes": [ 2096 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2096, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Div_output_0", "outputIndexes": [ 2097 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2097, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2098 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2077, 2098, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_1_output_0", "outputIndexes": [ 2099 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2099 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.19/self_attn/Neg_output_0", "outputIndexes": [ 2100 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2097, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2101 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2077, 22, 2101, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_output_0", "outputIndexes": [ 2102 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2100, 2102 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.19/self_attn/Concat_3_output_0", "outputIndexes": [ 2103 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8171", "outputIndexes": [ 2104 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8174", "outputIndexes": [ 2105 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2104, 2105, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8177", "outputIndexes": [ 2106 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2106 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8178", "outputIndexes": [ 2107 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2107 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8179", "outputIndexes": [ 2108 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2108, 2107 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8180", "outputIndexes": [ 2109 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2109, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_3_output_0", "outputIndexes": [ 2110 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2103, 2110 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_1_output_0", "outputIndexes": [ 2111 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2084, 2111 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Add_output_0", "outputIndexes": [ 2112 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4389 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2302945156, 2097174, 524288, 0, 0 ] } , "name": "/layers.19/self_attn/k_proj/Linear", "outputIndexes": [ 4394 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4394 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4395 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4395 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2113 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2064, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2114 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2072, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2115 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2114, 2115, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.19/self_attn/Concat_1_output_0", "outputIndexes": [ 2116 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2113, 2116 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/self_attn/Reshape_1_output_0", "outputIndexes": [ 2117 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2117 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2305566618, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.19/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2119 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2119, 2083 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_2_output_0", "outputIndexes": [ 2120 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2119 ] , "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_3_output_0", "outputIndexes": [ 2121 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2121 ] , "main_type": "NONE", "name": "Shape8142", "outputIndexes": [ 2122 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2121 ] , "main_type": "NONE", "name": "Rank8144", "outputIndexes": [ 2123 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2123, 2123 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8146", "outputIndexes": [ 2124 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2124 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8147", "outputIndexes": [ 2125 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2124, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8149", "outputIndexes": [ 2126 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2126 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8150", "outputIndexes": [ 2127 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2122, 2125, 2127, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8153", "outputIndexes": [ 2128 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2128 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8154", "outputIndexes": [ 2129 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2129 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8155", "outputIndexes": [ 2130 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2130, 2129 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8156", "outputIndexes": [ 2131 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2121, 2131, 2124 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_5_output_0", "outputIndexes": [ 2132 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2132, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Div_1_output_0", "outputIndexes": [ 2133 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2133, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2134 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2119, 2134, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_3_output_0", "outputIndexes": [ 2135 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2135 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.19/self_attn/Neg_1_output_0", "outputIndexes": [ 2136 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2133, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2137 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2119, 22, 2137, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_2_output_0", "outputIndexes": [ 2138 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2136, 2138 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.19/self_attn/Concat_4_output_0", "outputIndexes": [ 2139 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2139, 2110 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_3_output_0", "outputIndexes": [ 2140 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2120, 2140 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Add_1_output_0", "outputIndexes": [ 2141 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4389 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2305567642, 2097174, 524288, 0, 0 ] } , "name": "/layers.19/self_attn/v_proj/Linear", "outputIndexes": [ 4398 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4398 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4399 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4399 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2142 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2064, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2143 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2072, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2144 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2143, 2144, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.19/self_attn/Concat_2_output_0", "outputIndexes": [ 2145 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2142, 2145 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/self_attn/Reshape_2_output_0", "outputIndexes": [ 2146 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2112, 2141, 2146, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.19/self_attn/Reshape_7_output_0", "outputIndexes": [ 2147 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2147 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4400 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4400 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4401 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4401 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2308189104, 8388630, 2097152, 0, 0 ] } , "name": "/layers.19/self_attn/o_proj/Linear", "outputIndexes": [ 4402 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4402 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4403 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4403 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2148 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2051, 2148 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/Add_output_0", "outputIndexes": [ 2149 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2149 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2318674886, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.19/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2150 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2150 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4404 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4404 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4405 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4405 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2318707654, 25165846, 6291456, 0, 0 ] } , "name": "/layers.19/mlp/gate_proj/Linear", "outputIndexes": [ 4406 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4406 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4407 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4407 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2151 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2151 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.19/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2152 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4405 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2350164956, 25165846, 6291456, 0, 0 ] } , "name": "/layers.19/mlp/up_proj/Linear", "outputIndexes": [ 4410 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4410 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4411 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4411 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2153 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2152, 2153 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/mlp/Mul_output_0", "outputIndexes": [ 2154 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2154 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4412 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4412 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4413 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4413 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2381622258, 25165846, 6291456, 0, 0 ] } , "name": "/layers.19/mlp/down_proj/Linear", "outputIndexes": [ 4414 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4414 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4415 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4415 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2155 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2149, 2155 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/Add_1_output_0", "outputIndexes": [ 2156 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2156, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/Reshape_output_0", "outputIndexes": [ 2157 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2157 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2413079560, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.20/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2158 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2158 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4416 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4416 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4417 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4417 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2413112328, 8388630, 2097152, 0, 0 ] } , "name": "/layers.20/self_attn/q_proj/Linear", "outputIndexes": [ 4418 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4418 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4419 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4419 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2159 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2158 ] , "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_output_0", "outputIndexes": [ 2160 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2160 ] , "main_type": "NONE", "name": "Shape8501", "outputIndexes": [ 2161 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2160 ] , "main_type": "NONE", "name": "Rank8503", "outputIndexes": [ 2162 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2162, 2162 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8505", "outputIndexes": [ 2163 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2163 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8506", "outputIndexes": [ 2164 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2163, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8508", "outputIndexes": [ 2165 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2165 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8509", "outputIndexes": [ 2166 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2161, 2164, 2166, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8512", "outputIndexes": [ 2167 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2167 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8513", "outputIndexes": [ 2168 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2168, 2168 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8515", "outputIndexes": [ 2169 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2160, 2169, 2163 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_output_0", "outputIndexes": [ 2170 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2170, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2171 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2163 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8523", "outputIndexes": [ 2172 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2165 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8526", "outputIndexes": [ 2173 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2161, 2172, 2173, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8529", "outputIndexes": [ 2174 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2174 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8530", "outputIndexes": [ 2175 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2175 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8531", "outputIndexes": [ 2176 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2176, 2175 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8532", "outputIndexes": [ 2177 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2160, 2177, 2163 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_1_output_0", "outputIndexes": [ 2178 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2178, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2179 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2171, 2179, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.20/self_attn/Concat_output_0", "outputIndexes": [ 2180 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2159, 2180 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/self_attn/Reshape_output_0", "outputIndexes": [ 2181 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2181 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2423598110, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.20/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2183 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8550", "outputIndexes": [ 2184 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8553", "outputIndexes": [ 2185 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2184, 2185, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8556", "outputIndexes": [ 2186 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2186 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8557", "outputIndexes": [ 2187 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2187, 2187 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8559", "outputIndexes": [ 2188 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2188, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_2_output_0", "outputIndexes": [ 2189 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2183, 2189 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_output_0", "outputIndexes": [ 2190 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2183 ] , "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_2_output_0", "outputIndexes": [ 2191 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2191 ] , "main_type": "NONE", "name": "Shape8683", "outputIndexes": [ 2192 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2191 ] , "main_type": "NONE", "name": "Rank8685", "outputIndexes": [ 2193 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2193, 2193 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8687", "outputIndexes": [ 2194 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2194 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8688", "outputIndexes": [ 2195 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2194, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8690", "outputIndexes": [ 2196 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2196 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8691", "outputIndexes": [ 2197 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2192, 2195, 2197, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8694", "outputIndexes": [ 2198 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2198 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8695", "outputIndexes": [ 2199 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2199 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8696", "outputIndexes": [ 2200 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2200, 2199 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8697", "outputIndexes": [ 2201 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2191, 2201, 2194 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_4_output_0", "outputIndexes": [ 2202 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2202, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Div_output_0", "outputIndexes": [ 2203 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2203, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2204 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2183, 2204, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_1_output_0", "outputIndexes": [ 2205 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2205 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.20/self_attn/Neg_output_0", "outputIndexes": [ 2206 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2203, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2207 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2183, 22, 2207, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_output_0", "outputIndexes": [ 2208 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2206, 2208 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.20/self_attn/Concat_3_output_0", "outputIndexes": [ 2209 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8592", "outputIndexes": [ 2210 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8595", "outputIndexes": [ 2211 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2210, 2211, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8598", "outputIndexes": [ 2212 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2212 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8599", "outputIndexes": [ 2213 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2213 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8600", "outputIndexes": [ 2214 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2214, 2213 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8601", "outputIndexes": [ 2215 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2215, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_3_output_0", "outputIndexes": [ 2216 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2209, 2216 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_1_output_0", "outputIndexes": [ 2217 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2190, 2217 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Add_output_0", "outputIndexes": [ 2218 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4417 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2423599134, 2097174, 524288, 0, 0 ] } , "name": "/layers.20/self_attn/k_proj/Linear", "outputIndexes": [ 4422 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4422 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4423 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4423 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2219 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2170, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2220 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2178, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2221 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2220, 2221, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.20/self_attn/Concat_1_output_0", "outputIndexes": [ 2222 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2219, 2222 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/self_attn/Reshape_1_output_0", "outputIndexes": [ 2223 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2223 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2426220596, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.20/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2225 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2225, 2189 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_2_output_0", "outputIndexes": [ 2226 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2225 ] , "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_3_output_0", "outputIndexes": [ 2227 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2227 ] , "main_type": "NONE", "name": "Shape8563", "outputIndexes": [ 2228 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2227 ] , "main_type": "NONE", "name": "Rank8565", "outputIndexes": [ 2229 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2229, 2229 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8567", "outputIndexes": [ 2230 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2230 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8568", "outputIndexes": [ 2231 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2230, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8570", "outputIndexes": [ 2232 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2232 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8571", "outputIndexes": [ 2233 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2228, 2231, 2233, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8574", "outputIndexes": [ 2234 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2234 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8575", "outputIndexes": [ 2235 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2235 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8576", "outputIndexes": [ 2236 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2236, 2235 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8577", "outputIndexes": [ 2237 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2227, 2237, 2230 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_5_output_0", "outputIndexes": [ 2238 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2238, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Div_1_output_0", "outputIndexes": [ 2239 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2239, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2240 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2225, 2240, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_3_output_0", "outputIndexes": [ 2241 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2241 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.20/self_attn/Neg_1_output_0", "outputIndexes": [ 2242 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2239, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2243 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2225, 22, 2243, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_2_output_0", "outputIndexes": [ 2244 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2242, 2244 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.20/self_attn/Concat_4_output_0", "outputIndexes": [ 2245 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2245, 2216 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_3_output_0", "outputIndexes": [ 2246 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2226, 2246 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Add_1_output_0", "outputIndexes": [ 2247 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4417 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2426221620, 2097174, 524288, 0, 0 ] } , "name": "/layers.20/self_attn/v_proj/Linear", "outputIndexes": [ 4426 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4426 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4427 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4427 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2248 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2170, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2249 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2178, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2250 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2249, 2250, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.20/self_attn/Concat_2_output_0", "outputIndexes": [ 2251 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2248, 2251 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/self_attn/Reshape_2_output_0", "outputIndexes": [ 2252 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2218, 2247, 2252, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.20/self_attn/Reshape_7_output_0", "outputIndexes": [ 2253 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2253 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4428 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4428 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4429 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4429 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2428843082, 8388630, 2097152, 0, 0 ] } , "name": "/layers.20/self_attn/o_proj/Linear", "outputIndexes": [ 4430 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4430 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4431 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4431 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2254 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2157, 2254 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/Add_output_0", "outputIndexes": [ 2255 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2255 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2439328864, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.20/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2256 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2256 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4432 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4432 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4433 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4433 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2439361632, 25165846, 6291456, 0, 0 ] } , "name": "/layers.20/mlp/gate_proj/Linear", "outputIndexes": [ 4434 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4434 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4435 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4435 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2257 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2257 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.20/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2258 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4433 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2470818934, 25165846, 6291456, 0, 0 ] } , "name": "/layers.20/mlp/up_proj/Linear", "outputIndexes": [ 4438 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4438 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4439 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4439 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2259 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2258, 2259 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/mlp/Mul_output_0", "outputIndexes": [ 2260 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2260 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4440 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4440 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4441 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4441 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2502276236, 25165846, 6291456, 0, 0 ] } , "name": "/layers.20/mlp/down_proj/Linear", "outputIndexes": [ 4442 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4442 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4443 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4443 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2261 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2255, 2261 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/Add_1_output_0", "outputIndexes": [ 2262 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2262, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/Reshape_output_0", "outputIndexes": [ 2263 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2263 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2533733538, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.21/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2264 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2264 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4444 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4444 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4445 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4445 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2533766306, 8388630, 2097152, 0, 0 ] } , "name": "/layers.21/self_attn/q_proj/Linear", "outputIndexes": [ 4446 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4446 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4447 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4447 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2265 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2264 ] , "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_output_0", "outputIndexes": [ 2266 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2266 ] , "main_type": "NONE", "name": "Shape8922", "outputIndexes": [ 2267 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2266 ] , "main_type": "NONE", "name": "Rank8924", "outputIndexes": [ 2268 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2268, 2268 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8926", "outputIndexes": [ 2269 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2269 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8927", "outputIndexes": [ 2270 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2269, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8929", "outputIndexes": [ 2271 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2271 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8930", "outputIndexes": [ 2272 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2267, 2270, 2272, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8933", "outputIndexes": [ 2273 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2273 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8934", "outputIndexes": [ 2274 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2274, 2274 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8936", "outputIndexes": [ 2275 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2266, 2275, 2269 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_output_0", "outputIndexes": [ 2276 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2276, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2277 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2269 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8944", "outputIndexes": [ 2278 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2271 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8947", "outputIndexes": [ 2279 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2267, 2278, 2279, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8950", "outputIndexes": [ 2280 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2280 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8951", "outputIndexes": [ 2281 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2281 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8952", "outputIndexes": [ 2282 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2282, 2281 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8953", "outputIndexes": [ 2283 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2266, 2283, 2269 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_1_output_0", "outputIndexes": [ 2284 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2284, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2285 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2277, 2285, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.21/self_attn/Concat_output_0", "outputIndexes": [ 2286 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2265, 2286 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/self_attn/Reshape_output_0", "outputIndexes": [ 2287 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2287 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2544252088, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.21/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2289 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8971", "outputIndexes": [ 2290 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8974", "outputIndexes": [ 2291 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2290, 2291, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8977", "outputIndexes": [ 2292 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2292 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8978", "outputIndexes": [ 2293 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2293, 2293 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8980", "outputIndexes": [ 2294 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2294, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_2_output_0", "outputIndexes": [ 2295 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2289, 2295 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_output_0", "outputIndexes": [ 2296 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2289 ] , "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_2_output_0", "outputIndexes": [ 2297 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2297 ] , "main_type": "NONE", "name": "Shape9104", "outputIndexes": [ 2298 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2297 ] , "main_type": "NONE", "name": "Rank9106", "outputIndexes": [ 2299 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2299, 2299 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9108", "outputIndexes": [ 2300 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2300 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9109", "outputIndexes": [ 2301 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2300, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9111", "outputIndexes": [ 2302 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2302 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9112", "outputIndexes": [ 2303 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2298, 2301, 2303, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9115", "outputIndexes": [ 2304 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2304 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9116", "outputIndexes": [ 2305 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2305 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9117", "outputIndexes": [ 2306 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2306, 2305 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9118", "outputIndexes": [ 2307 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2297, 2307, 2300 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_4_output_0", "outputIndexes": [ 2308 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2308, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Div_output_0", "outputIndexes": [ 2309 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2309, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2310 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2289, 2310, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_1_output_0", "outputIndexes": [ 2311 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2311 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.21/self_attn/Neg_output_0", "outputIndexes": [ 2312 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2309, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2313 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2289, 22, 2313, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_output_0", "outputIndexes": [ 2314 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2312, 2314 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.21/self_attn/Concat_3_output_0", "outputIndexes": [ 2315 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9013", "outputIndexes": [ 2316 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9016", "outputIndexes": [ 2317 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2316, 2317, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9019", "outputIndexes": [ 2318 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2318 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9020", "outputIndexes": [ 2319 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2319 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9021", "outputIndexes": [ 2320 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2320, 2319 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9022", "outputIndexes": [ 2321 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2321, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_3_output_0", "outputIndexes": [ 2322 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2315, 2322 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_1_output_0", "outputIndexes": [ 2323 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2296, 2323 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Add_output_0", "outputIndexes": [ 2324 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4445 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2544253112, 2097174, 524288, 0, 0 ] } , "name": "/layers.21/self_attn/k_proj/Linear", "outputIndexes": [ 4450 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4450 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4451 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4451 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2325 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2276, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2326 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2284, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2327 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2326, 2327, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.21/self_attn/Concat_1_output_0", "outputIndexes": [ 2328 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2325, 2328 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/self_attn/Reshape_1_output_0", "outputIndexes": [ 2329 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2329 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2546874574, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.21/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2331 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2331, 2295 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_2_output_0", "outputIndexes": [ 2332 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2331 ] , "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_3_output_0", "outputIndexes": [ 2333 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2333 ] , "main_type": "NONE", "name": "Shape8984", "outputIndexes": [ 2334 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2333 ] , "main_type": "NONE", "name": "Rank8986", "outputIndexes": [ 2335 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2335, 2335 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8988", "outputIndexes": [ 2336 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2336 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8989", "outputIndexes": [ 2337 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2336, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8991", "outputIndexes": [ 2338 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2338 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8992", "outputIndexes": [ 2339 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2334, 2337, 2339, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8995", "outputIndexes": [ 2340 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2340 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8996", "outputIndexes": [ 2341 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2341 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8997", "outputIndexes": [ 2342 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2342, 2341 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8998", "outputIndexes": [ 2343 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2333, 2343, 2336 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_5_output_0", "outputIndexes": [ 2344 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2344, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Div_1_output_0", "outputIndexes": [ 2345 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2345, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2346 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2331, 2346, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_3_output_0", "outputIndexes": [ 2347 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2347 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.21/self_attn/Neg_1_output_0", "outputIndexes": [ 2348 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2345, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2349 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2331, 22, 2349, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_2_output_0", "outputIndexes": [ 2350 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2348, 2350 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.21/self_attn/Concat_4_output_0", "outputIndexes": [ 2351 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2351, 2322 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_3_output_0", "outputIndexes": [ 2352 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2332, 2352 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Add_1_output_0", "outputIndexes": [ 2353 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4445 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2546875598, 2097174, 524288, 0, 0 ] } , "name": "/layers.21/self_attn/v_proj/Linear", "outputIndexes": [ 4454 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4454 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4455 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4455 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2354 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2276, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2355 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2284, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2356 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2355, 2356, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.21/self_attn/Concat_2_output_0", "outputIndexes": [ 2357 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2354, 2357 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/self_attn/Reshape_2_output_0", "outputIndexes": [ 2358 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2324, 2353, 2358, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.21/self_attn/Reshape_7_output_0", "outputIndexes": [ 2359 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2359 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4456 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4456 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4457 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4457 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2549497060, 8388630, 2097152, 0, 0 ] } , "name": "/layers.21/self_attn/o_proj/Linear", "outputIndexes": [ 4458 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4458 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4459 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4459 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2360 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2263, 2360 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/Add_output_0", "outputIndexes": [ 2361 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2361 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2559982842, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.21/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2362 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2362 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4460 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4460 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4461 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4461 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2560015610, 25165846, 6291456, 0, 0 ] } , "name": "/layers.21/mlp/gate_proj/Linear", "outputIndexes": [ 4462 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4462 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4463 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4463 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2363 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2363 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.21/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2364 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4461 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2591472912, 25165846, 6291456, 0, 0 ] } , "name": "/layers.21/mlp/up_proj/Linear", "outputIndexes": [ 4466 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4466 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4467 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4467 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2365 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2364, 2365 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/mlp/Mul_output_0", "outputIndexes": [ 2366 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2366 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4468 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4468 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4469 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4469 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2622930214, 25165846, 6291456, 0, 0 ] } , "name": "/layers.21/mlp/down_proj/Linear", "outputIndexes": [ 4470 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4470 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4471 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4471 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2367 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2361, 2367 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/Add_1_output_0", "outputIndexes": [ 2368 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2368, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/Reshape_output_0", "outputIndexes": [ 2369 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2369 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2654387516, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.22/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2370 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2370 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4472 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4472 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4473 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4473 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2654420284, 8388630, 2097152, 0, 0 ] } , "name": "/layers.22/self_attn/q_proj/Linear", "outputIndexes": [ 4474 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4474 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4475 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4475 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2371 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2370 ] , "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_output_0", "outputIndexes": [ 2372 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2372 ] , "main_type": "NONE", "name": "Shape9343", "outputIndexes": [ 2373 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2372 ] , "main_type": "NONE", "name": "Rank9345", "outputIndexes": [ 2374 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2374, 2374 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9347", "outputIndexes": [ 2375 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2375 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9348", "outputIndexes": [ 2376 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2375, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9350", "outputIndexes": [ 2377 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2377 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9351", "outputIndexes": [ 2378 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2373, 2376, 2378, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9354", "outputIndexes": [ 2379 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2379 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9355", "outputIndexes": [ 2380 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2380, 2380 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9357", "outputIndexes": [ 2381 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2372, 2381, 2375 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_output_0", "outputIndexes": [ 2382 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2382, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2383 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2375 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9365", "outputIndexes": [ 2384 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2377 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9368", "outputIndexes": [ 2385 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2373, 2384, 2385, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9371", "outputIndexes": [ 2386 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2386 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9372", "outputIndexes": [ 2387 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2387 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9373", "outputIndexes": [ 2388 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2388, 2387 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9374", "outputIndexes": [ 2389 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2372, 2389, 2375 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_1_output_0", "outputIndexes": [ 2390 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2390, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2391 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2383, 2391, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.22/self_attn/Concat_output_0", "outputIndexes": [ 2392 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2371, 2392 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/self_attn/Reshape_output_0", "outputIndexes": [ 2393 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2393 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2664906066, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.22/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2395 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9392", "outputIndexes": [ 2396 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9395", "outputIndexes": [ 2397 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2396, 2397, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9398", "outputIndexes": [ 2398 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2398 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9399", "outputIndexes": [ 2399 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2399, 2399 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9401", "outputIndexes": [ 2400 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2400, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_2_output_0", "outputIndexes": [ 2401 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2395, 2401 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_output_0", "outputIndexes": [ 2402 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2395 ] , "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_2_output_0", "outputIndexes": [ 2403 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2403 ] , "main_type": "NONE", "name": "Shape9525", "outputIndexes": [ 2404 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2403 ] , "main_type": "NONE", "name": "Rank9527", "outputIndexes": [ 2405 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2405, 2405 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9529", "outputIndexes": [ 2406 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2406 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9530", "outputIndexes": [ 2407 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2406, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9532", "outputIndexes": [ 2408 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2408 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9533", "outputIndexes": [ 2409 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2404, 2407, 2409, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9536", "outputIndexes": [ 2410 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2410 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9537", "outputIndexes": [ 2411 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2411 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9538", "outputIndexes": [ 2412 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2412, 2411 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9539", "outputIndexes": [ 2413 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2403, 2413, 2406 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_4_output_0", "outputIndexes": [ 2414 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2414, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Div_output_0", "outputIndexes": [ 2415 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2415, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2416 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2395, 2416, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_1_output_0", "outputIndexes": [ 2417 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2417 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.22/self_attn/Neg_output_0", "outputIndexes": [ 2418 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2415, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2419 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2395, 22, 2419, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_output_0", "outputIndexes": [ 2420 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2418, 2420 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.22/self_attn/Concat_3_output_0", "outputIndexes": [ 2421 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9434", "outputIndexes": [ 2422 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9437", "outputIndexes": [ 2423 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2422, 2423, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9440", "outputIndexes": [ 2424 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2424 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9441", "outputIndexes": [ 2425 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2425 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9442", "outputIndexes": [ 2426 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2426, 2425 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9443", "outputIndexes": [ 2427 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2427, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_3_output_0", "outputIndexes": [ 2428 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2421, 2428 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_1_output_0", "outputIndexes": [ 2429 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2402, 2429 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Add_output_0", "outputIndexes": [ 2430 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4473 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2664907090, 2097174, 524288, 0, 0 ] } , "name": "/layers.22/self_attn/k_proj/Linear", "outputIndexes": [ 4478 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4478 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4479 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4479 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2431 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2382, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2432 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2390, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2433 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2432, 2433, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.22/self_attn/Concat_1_output_0", "outputIndexes": [ 2434 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2431, 2434 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/self_attn/Reshape_1_output_0", "outputIndexes": [ 2435 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2435 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2667528552, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.22/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2437 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2437, 2401 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_2_output_0", "outputIndexes": [ 2438 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2437 ] , "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_3_output_0", "outputIndexes": [ 2439 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2439 ] , "main_type": "NONE", "name": "Shape9405", "outputIndexes": [ 2440 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2439 ] , "main_type": "NONE", "name": "Rank9407", "outputIndexes": [ 2441 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2441, 2441 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9409", "outputIndexes": [ 2442 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2442 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9410", "outputIndexes": [ 2443 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2442, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9412", "outputIndexes": [ 2444 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2444 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9413", "outputIndexes": [ 2445 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2440, 2443, 2445, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9416", "outputIndexes": [ 2446 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2446 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9417", "outputIndexes": [ 2447 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2447 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9418", "outputIndexes": [ 2448 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2448, 2447 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9419", "outputIndexes": [ 2449 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2439, 2449, 2442 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_5_output_0", "outputIndexes": [ 2450 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2450, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Div_1_output_0", "outputIndexes": [ 2451 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2451, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2452 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2437, 2452, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_3_output_0", "outputIndexes": [ 2453 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2453 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.22/self_attn/Neg_1_output_0", "outputIndexes": [ 2454 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2451, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2455 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2437, 22, 2455, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_2_output_0", "outputIndexes": [ 2456 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2454, 2456 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.22/self_attn/Concat_4_output_0", "outputIndexes": [ 2457 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2457, 2428 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_3_output_0", "outputIndexes": [ 2458 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2438, 2458 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Add_1_output_0", "outputIndexes": [ 2459 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4473 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2667529576, 2097174, 524288, 0, 0 ] } , "name": "/layers.22/self_attn/v_proj/Linear", "outputIndexes": [ 4482 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4482 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4483 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4483 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2460 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2382, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2461 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2390, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2462 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2461, 2462, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.22/self_attn/Concat_2_output_0", "outputIndexes": [ 2463 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2460, 2463 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/self_attn/Reshape_2_output_0", "outputIndexes": [ 2464 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2430, 2459, 2464, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.22/self_attn/Reshape_7_output_0", "outputIndexes": [ 2465 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2465 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4484 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4484 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4485 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4485 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2670151038, 8388630, 2097152, 0, 0 ] } , "name": "/layers.22/self_attn/o_proj/Linear", "outputIndexes": [ 4486 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4486 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4487 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4487 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2466 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2369, 2466 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/Add_output_0", "outputIndexes": [ 2467 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2467 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2680636820, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.22/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2468 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2468 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4488 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4488 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4489 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4489 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2680669588, 25165846, 6291456, 0, 0 ] } , "name": "/layers.22/mlp/gate_proj/Linear", "outputIndexes": [ 4490 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4490 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4491 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4491 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2469 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2469 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.22/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2470 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4489 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2712126890, 25165846, 6291456, 0, 0 ] } , "name": "/layers.22/mlp/up_proj/Linear", "outputIndexes": [ 4494 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4494 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4495 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4495 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2471 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2470, 2471 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/mlp/Mul_output_0", "outputIndexes": [ 2472 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2472 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4496 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4496 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4497 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4497 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2743584192, 25165846, 6291456, 0, 0 ] } , "name": "/layers.22/mlp/down_proj/Linear", "outputIndexes": [ 4498 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4498 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4499 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4499 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2473 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2467, 2473 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/Add_1_output_0", "outputIndexes": [ 2474 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2474, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/Reshape_output_0", "outputIndexes": [ 2475 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2475 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2775041494, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.23/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2476 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2476 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4500 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4500 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4501 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4501 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2775074262, 8388630, 2097152, 0, 0 ] } , "name": "/layers.23/self_attn/q_proj/Linear", "outputIndexes": [ 4502 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4502 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4503 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4503 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2477 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2476 ] , "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_output_0", "outputIndexes": [ 2478 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2478 ] , "main_type": "NONE", "name": "Shape9764", "outputIndexes": [ 2479 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2478 ] , "main_type": "NONE", "name": "Rank9766", "outputIndexes": [ 2480 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2480, 2480 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9768", "outputIndexes": [ 2481 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2481 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9769", "outputIndexes": [ 2482 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2481, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9771", "outputIndexes": [ 2483 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2483 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9772", "outputIndexes": [ 2484 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2479, 2482, 2484, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9775", "outputIndexes": [ 2485 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2485 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9776", "outputIndexes": [ 2486 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2486, 2486 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9778", "outputIndexes": [ 2487 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2478, 2487, 2481 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_output_0", "outputIndexes": [ 2488 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2488, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2489 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2481 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9786", "outputIndexes": [ 2490 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2483 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9789", "outputIndexes": [ 2491 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2479, 2490, 2491, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9792", "outputIndexes": [ 2492 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2492 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9793", "outputIndexes": [ 2493 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2493 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9794", "outputIndexes": [ 2494 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2494, 2493 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9795", "outputIndexes": [ 2495 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2478, 2495, 2481 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_1_output_0", "outputIndexes": [ 2496 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2496, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2497 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2489, 2497, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.23/self_attn/Concat_output_0", "outputIndexes": [ 2498 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2477, 2498 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/self_attn/Reshape_output_0", "outputIndexes": [ 2499 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2499 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2785560044, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.23/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2501 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9813", "outputIndexes": [ 2502 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9816", "outputIndexes": [ 2503 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2502, 2503, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9819", "outputIndexes": [ 2504 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2504 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9820", "outputIndexes": [ 2505 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2505, 2505 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9822", "outputIndexes": [ 2506 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2506, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_2_output_0", "outputIndexes": [ 2507 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2501, 2507 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_output_0", "outputIndexes": [ 2508 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2501 ] , "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_2_output_0", "outputIndexes": [ 2509 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2509 ] , "main_type": "NONE", "name": "Shape9946", "outputIndexes": [ 2510 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2509 ] , "main_type": "NONE", "name": "Rank9948", "outputIndexes": [ 2511 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2511, 2511 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9950", "outputIndexes": [ 2512 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2512 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9951", "outputIndexes": [ 2513 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2512, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9953", "outputIndexes": [ 2514 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2514 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9954", "outputIndexes": [ 2515 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2510, 2513, 2515, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9957", "outputIndexes": [ 2516 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2516 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9958", "outputIndexes": [ 2517 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2517 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9959", "outputIndexes": [ 2518 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2518, 2517 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9960", "outputIndexes": [ 2519 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2509, 2519, 2512 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_4_output_0", "outputIndexes": [ 2520 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2520, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Div_output_0", "outputIndexes": [ 2521 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2521, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2522 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2501, 2522, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_1_output_0", "outputIndexes": [ 2523 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2523 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.23/self_attn/Neg_output_0", "outputIndexes": [ 2524 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2521, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2525 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2501, 22, 2525, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_output_0", "outputIndexes": [ 2526 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2524, 2526 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.23/self_attn/Concat_3_output_0", "outputIndexes": [ 2527 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9855", "outputIndexes": [ 2528 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9858", "outputIndexes": [ 2529 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2528, 2529, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9861", "outputIndexes": [ 2530 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2530 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9862", "outputIndexes": [ 2531 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2531 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9863", "outputIndexes": [ 2532 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2532, 2531 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9864", "outputIndexes": [ 2533 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2533, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_3_output_0", "outputIndexes": [ 2534 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2527, 2534 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_1_output_0", "outputIndexes": [ 2535 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2508, 2535 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Add_output_0", "outputIndexes": [ 2536 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4501 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2785561068, 2097174, 524288, 0, 0 ] } , "name": "/layers.23/self_attn/k_proj/Linear", "outputIndexes": [ 4506 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4506 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4507 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4507 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2537 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2488, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2538 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2496, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2539 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2538, 2539, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.23/self_attn/Concat_1_output_0", "outputIndexes": [ 2540 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2537, 2540 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/self_attn/Reshape_1_output_0", "outputIndexes": [ 2541 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2541 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2788182530, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.23/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2543 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2543, 2507 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_2_output_0", "outputIndexes": [ 2544 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2543 ] , "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_3_output_0", "outputIndexes": [ 2545 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2545 ] , "main_type": "NONE", "name": "Shape9826", "outputIndexes": [ 2546 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2545 ] , "main_type": "NONE", "name": "Rank9828", "outputIndexes": [ 2547 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2547, 2547 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9830", "outputIndexes": [ 2548 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2548 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9831", "outputIndexes": [ 2549 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2548, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9833", "outputIndexes": [ 2550 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2550 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9834", "outputIndexes": [ 2551 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2546, 2549, 2551, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9837", "outputIndexes": [ 2552 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2552 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9838", "outputIndexes": [ 2553 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2553 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9839", "outputIndexes": [ 2554 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2554, 2553 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9840", "outputIndexes": [ 2555 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2545, 2555, 2548 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_5_output_0", "outputIndexes": [ 2556 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2556, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Div_1_output_0", "outputIndexes": [ 2557 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2557, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2558 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2543, 2558, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_3_output_0", "outputIndexes": [ 2559 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2559 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.23/self_attn/Neg_1_output_0", "outputIndexes": [ 2560 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2557, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2561 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2543, 22, 2561, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_2_output_0", "outputIndexes": [ 2562 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2560, 2562 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.23/self_attn/Concat_4_output_0", "outputIndexes": [ 2563 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2563, 2534 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_3_output_0", "outputIndexes": [ 2564 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2544, 2564 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Add_1_output_0", "outputIndexes": [ 2565 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4501 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2788183554, 2097174, 524288, 0, 0 ] } , "name": "/layers.23/self_attn/v_proj/Linear", "outputIndexes": [ 4510 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4510 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4511 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4511 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2566 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2488, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2567 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2496, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2568 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2567, 2568, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.23/self_attn/Concat_2_output_0", "outputIndexes": [ 2569 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2566, 2569 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/self_attn/Reshape_2_output_0", "outputIndexes": [ 2570 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2536, 2565, 2570, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.23/self_attn/Reshape_7_output_0", "outputIndexes": [ 2571 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2571 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4512 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4512 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4513 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4513 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2790805016, 8388630, 2097152, 0, 0 ] } , "name": "/layers.23/self_attn/o_proj/Linear", "outputIndexes": [ 4514 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4514 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4515 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4515 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2572 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2475, 2572 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/Add_output_0", "outputIndexes": [ 2573 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2573 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2801290798, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.23/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2574 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2574 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4516 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4516 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4517 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4517 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2801323566, 25165846, 6291456, 0, 0 ] } , "name": "/layers.23/mlp/gate_proj/Linear", "outputIndexes": [ 4518 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4518 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4519 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4519 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2575 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2575 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.23/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2576 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4517 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2832780868, 25165846, 6291456, 0, 0 ] } , "name": "/layers.23/mlp/up_proj/Linear", "outputIndexes": [ 4522 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4522 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4523 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4523 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2577 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2576, 2577 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/mlp/Mul_output_0", "outputIndexes": [ 2578 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2578 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4524 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4524 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4525 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4525 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2864238170, 25165846, 6291456, 0, 0 ] } , "name": "/layers.23/mlp/down_proj/Linear", "outputIndexes": [ 4526 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4526 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4527 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4527 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2579 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2573, 2579 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/Add_1_output_0", "outputIndexes": [ 2580 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2580, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/Reshape_output_0", "outputIndexes": [ 2581 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2581 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2895695472, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.24/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2582 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2582 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4528 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4528 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4529 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4529 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2895728240, 8388630, 2097152, 0, 0 ] } , "name": "/layers.24/self_attn/q_proj/Linear", "outputIndexes": [ 4530 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4530 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4531 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4531 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2583 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2582 ] , "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_output_0", "outputIndexes": [ 2584 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2584 ] , "main_type": "NONE", "name": "Shape10185", "outputIndexes": [ 2585 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2584 ] , "main_type": "NONE", "name": "Rank10187", "outputIndexes": [ 2586 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2586, 2586 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10189", "outputIndexes": [ 2587 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2587 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10190", "outputIndexes": [ 2588 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2587, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10192", "outputIndexes": [ 2589 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2589 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10193", "outputIndexes": [ 2590 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2585, 2588, 2590, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10196", "outputIndexes": [ 2591 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2591 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10197", "outputIndexes": [ 2592 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2592, 2592 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10199", "outputIndexes": [ 2593 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2584, 2593, 2587 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_output_0", "outputIndexes": [ 2594 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2594, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2595 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2587 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10207", "outputIndexes": [ 2596 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2589 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10210", "outputIndexes": [ 2597 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2585, 2596, 2597, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10213", "outputIndexes": [ 2598 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2598 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10214", "outputIndexes": [ 2599 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2599 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10215", "outputIndexes": [ 2600 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2600, 2599 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10216", "outputIndexes": [ 2601 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2584, 2601, 2587 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_1_output_0", "outputIndexes": [ 2602 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2602, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2603 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2595, 2603, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.24/self_attn/Concat_output_0", "outputIndexes": [ 2604 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2583, 2604 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/self_attn/Reshape_output_0", "outputIndexes": [ 2605 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2605 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2906214022, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.24/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2607 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10234", "outputIndexes": [ 2608 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10237", "outputIndexes": [ 2609 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2608, 2609, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10240", "outputIndexes": [ 2610 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2610 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10241", "outputIndexes": [ 2611 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2611, 2611 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10243", "outputIndexes": [ 2612 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2612, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_2_output_0", "outputIndexes": [ 2613 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2607, 2613 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_output_0", "outputIndexes": [ 2614 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2607 ] , "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_2_output_0", "outputIndexes": [ 2615 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2615 ] , "main_type": "NONE", "name": "Shape10367", "outputIndexes": [ 2616 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2615 ] , "main_type": "NONE", "name": "Rank10369", "outputIndexes": [ 2617 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2617, 2617 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10371", "outputIndexes": [ 2618 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2618 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10372", "outputIndexes": [ 2619 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2618, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10374", "outputIndexes": [ 2620 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2620 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10375", "outputIndexes": [ 2621 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2616, 2619, 2621, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10378", "outputIndexes": [ 2622 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2622 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10379", "outputIndexes": [ 2623 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2623 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10380", "outputIndexes": [ 2624 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2624, 2623 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10381", "outputIndexes": [ 2625 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2615, 2625, 2618 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_4_output_0", "outputIndexes": [ 2626 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2626, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Div_output_0", "outputIndexes": [ 2627 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2627, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2628 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2607, 2628, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_1_output_0", "outputIndexes": [ 2629 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2629 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.24/self_attn/Neg_output_0", "outputIndexes": [ 2630 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2627, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2631 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2607, 22, 2631, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_output_0", "outputIndexes": [ 2632 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2630, 2632 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.24/self_attn/Concat_3_output_0", "outputIndexes": [ 2633 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10276", "outputIndexes": [ 2634 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10279", "outputIndexes": [ 2635 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2634, 2635, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10282", "outputIndexes": [ 2636 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2636 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10283", "outputIndexes": [ 2637 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2637 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10284", "outputIndexes": [ 2638 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2638, 2637 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10285", "outputIndexes": [ 2639 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2639, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_3_output_0", "outputIndexes": [ 2640 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2633, 2640 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_1_output_0", "outputIndexes": [ 2641 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2614, 2641 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Add_output_0", "outputIndexes": [ 2642 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4529 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2906215046, 2097174, 524288, 0, 0 ] } , "name": "/layers.24/self_attn/k_proj/Linear", "outputIndexes": [ 4534 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4534 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4535 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4535 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2643 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2594, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2644 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2602, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2645 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2644, 2645, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.24/self_attn/Concat_1_output_0", "outputIndexes": [ 2646 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2643, 2646 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/self_attn/Reshape_1_output_0", "outputIndexes": [ 2647 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2647 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2908836508, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.24/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2649 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2649, 2613 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_2_output_0", "outputIndexes": [ 2650 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2649 ] , "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_3_output_0", "outputIndexes": [ 2651 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2651 ] , "main_type": "NONE", "name": "Shape10247", "outputIndexes": [ 2652 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2651 ] , "main_type": "NONE", "name": "Rank10249", "outputIndexes": [ 2653 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2653, 2653 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10251", "outputIndexes": [ 2654 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2654 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10252", "outputIndexes": [ 2655 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2654, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10254", "outputIndexes": [ 2656 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2656 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10255", "outputIndexes": [ 2657 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2652, 2655, 2657, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10258", "outputIndexes": [ 2658 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2658 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10259", "outputIndexes": [ 2659 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2659 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10260", "outputIndexes": [ 2660 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2660, 2659 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10261", "outputIndexes": [ 2661 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2651, 2661, 2654 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_5_output_0", "outputIndexes": [ 2662 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2662, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Div_1_output_0", "outputIndexes": [ 2663 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2663, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2664 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2649, 2664, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_3_output_0", "outputIndexes": [ 2665 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2665 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.24/self_attn/Neg_1_output_0", "outputIndexes": [ 2666 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2663, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2667 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2649, 22, 2667, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_2_output_0", "outputIndexes": [ 2668 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2666, 2668 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.24/self_attn/Concat_4_output_0", "outputIndexes": [ 2669 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2669, 2640 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_3_output_0", "outputIndexes": [ 2670 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2650, 2670 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Add_1_output_0", "outputIndexes": [ 2671 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4529 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2908837532, 2097174, 524288, 0, 0 ] } , "name": "/layers.24/self_attn/v_proj/Linear", "outputIndexes": [ 4538 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4538 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4539 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4539 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2672 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2594, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2673 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2602, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2674 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2673, 2674, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.24/self_attn/Concat_2_output_0", "outputIndexes": [ 2675 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2672, 2675 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/self_attn/Reshape_2_output_0", "outputIndexes": [ 2676 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2642, 2671, 2676, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.24/self_attn/Reshape_7_output_0", "outputIndexes": [ 2677 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2677 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4540 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4540 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4541 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4541 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2911458994, 8388630, 2097152, 0, 0 ] } , "name": "/layers.24/self_attn/o_proj/Linear", "outputIndexes": [ 4542 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4542 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4543 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4543 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2678 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2581, 2678 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/Add_output_0", "outputIndexes": [ 2679 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2679 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2921944776, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.24/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2680 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2680 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4544 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4544 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4545 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4545 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2921977544, 25165846, 6291456, 0, 0 ] } , "name": "/layers.24/mlp/gate_proj/Linear", "outputIndexes": [ 4546 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4546 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4547 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4547 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2681 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2681 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.24/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2682 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4545 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2953434846, 25165846, 6291456, 0, 0 ] } , "name": "/layers.24/mlp/up_proj/Linear", "outputIndexes": [ 4550 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4550 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4551 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4551 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2683 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2682, 2683 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/mlp/Mul_output_0", "outputIndexes": [ 2684 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2684 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4552 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4552 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4553 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4553 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2984892148, 25165846, 6291456, 0, 0 ] } , "name": "/layers.24/mlp/down_proj/Linear", "outputIndexes": [ 4554 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4554 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4555 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4555 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2685 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2679, 2685 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/Add_1_output_0", "outputIndexes": [ 2686 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2686, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/Reshape_output_0", "outputIndexes": [ 2687 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2687 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3016349450, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.25/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2688 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2688 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4556 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4556 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4557 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4557 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3016382218, 8388630, 2097152, 0, 0 ] } , "name": "/layers.25/self_attn/q_proj/Linear", "outputIndexes": [ 4558 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4558 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4559 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4559 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2689 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2688 ] , "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_output_0", "outputIndexes": [ 2690 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2690 ] , "main_type": "NONE", "name": "Shape10606", "outputIndexes": [ 2691 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2690 ] , "main_type": "NONE", "name": "Rank10608", "outputIndexes": [ 2692 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2692, 2692 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10610", "outputIndexes": [ 2693 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2693 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10611", "outputIndexes": [ 2694 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2693, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10613", "outputIndexes": [ 2695 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2695 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10614", "outputIndexes": [ 2696 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2691, 2694, 2696, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10617", "outputIndexes": [ 2697 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2697 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10618", "outputIndexes": [ 2698 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2698, 2698 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10620", "outputIndexes": [ 2699 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2690, 2699, 2693 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_output_0", "outputIndexes": [ 2700 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2700, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2701 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2693 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10628", "outputIndexes": [ 2702 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2695 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10631", "outputIndexes": [ 2703 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2691, 2702, 2703, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10634", "outputIndexes": [ 2704 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2704 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10635", "outputIndexes": [ 2705 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2705 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10636", "outputIndexes": [ 2706 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2706, 2705 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10637", "outputIndexes": [ 2707 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2690, 2707, 2693 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_1_output_0", "outputIndexes": [ 2708 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2708, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2709 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2701, 2709, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.25/self_attn/Concat_output_0", "outputIndexes": [ 2710 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2689, 2710 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/self_attn/Reshape_output_0", "outputIndexes": [ 2711 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2711 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3026868000, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.25/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2713 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10655", "outputIndexes": [ 2714 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10658", "outputIndexes": [ 2715 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2714, 2715, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10661", "outputIndexes": [ 2716 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2716 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10662", "outputIndexes": [ 2717 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2717, 2717 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10664", "outputIndexes": [ 2718 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2718, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_2_output_0", "outputIndexes": [ 2719 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2713, 2719 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_output_0", "outputIndexes": [ 2720 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2713 ] , "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_2_output_0", "outputIndexes": [ 2721 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2721 ] , "main_type": "NONE", "name": "Shape10788", "outputIndexes": [ 2722 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2721 ] , "main_type": "NONE", "name": "Rank10790", "outputIndexes": [ 2723 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2723, 2723 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10792", "outputIndexes": [ 2724 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2724 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10793", "outputIndexes": [ 2725 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2724, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10795", "outputIndexes": [ 2726 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2726 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10796", "outputIndexes": [ 2727 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2722, 2725, 2727, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10799", "outputIndexes": [ 2728 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2728 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10800", "outputIndexes": [ 2729 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2729 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10801", "outputIndexes": [ 2730 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2730, 2729 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10802", "outputIndexes": [ 2731 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2721, 2731, 2724 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_4_output_0", "outputIndexes": [ 2732 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2732, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Div_output_0", "outputIndexes": [ 2733 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2733, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2734 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2713, 2734, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_1_output_0", "outputIndexes": [ 2735 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2735 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.25/self_attn/Neg_output_0", "outputIndexes": [ 2736 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2733, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2737 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2713, 22, 2737, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_output_0", "outputIndexes": [ 2738 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2736, 2738 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.25/self_attn/Concat_3_output_0", "outputIndexes": [ 2739 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10697", "outputIndexes": [ 2740 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10700", "outputIndexes": [ 2741 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2740, 2741, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10703", "outputIndexes": [ 2742 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2742 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10704", "outputIndexes": [ 2743 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2743 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10705", "outputIndexes": [ 2744 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2744, 2743 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10706", "outputIndexes": [ 2745 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2745, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_3_output_0", "outputIndexes": [ 2746 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2739, 2746 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_1_output_0", "outputIndexes": [ 2747 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2720, 2747 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Add_output_0", "outputIndexes": [ 2748 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4557 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3026869024, 2097174, 524288, 0, 0 ] } , "name": "/layers.25/self_attn/k_proj/Linear", "outputIndexes": [ 4562 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4562 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4563 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4563 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2749 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2700, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2750 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2708, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2751 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2750, 2751, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.25/self_attn/Concat_1_output_0", "outputIndexes": [ 2752 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2749, 2752 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/self_attn/Reshape_1_output_0", "outputIndexes": [ 2753 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2753 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3029490486, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.25/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2755 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2755, 2719 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_2_output_0", "outputIndexes": [ 2756 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2755 ] , "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_3_output_0", "outputIndexes": [ 2757 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2757 ] , "main_type": "NONE", "name": "Shape10668", "outputIndexes": [ 2758 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2757 ] , "main_type": "NONE", "name": "Rank10670", "outputIndexes": [ 2759 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2759, 2759 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10672", "outputIndexes": [ 2760 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2760 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10673", "outputIndexes": [ 2761 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2760, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10675", "outputIndexes": [ 2762 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2762 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10676", "outputIndexes": [ 2763 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2758, 2761, 2763, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10679", "outputIndexes": [ 2764 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2764 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10680", "outputIndexes": [ 2765 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2765 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10681", "outputIndexes": [ 2766 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2766, 2765 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10682", "outputIndexes": [ 2767 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2757, 2767, 2760 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_5_output_0", "outputIndexes": [ 2768 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2768, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Div_1_output_0", "outputIndexes": [ 2769 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2769, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2770 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2755, 2770, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_3_output_0", "outputIndexes": [ 2771 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2771 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.25/self_attn/Neg_1_output_0", "outputIndexes": [ 2772 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2769, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2773 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2755, 22, 2773, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_2_output_0", "outputIndexes": [ 2774 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2772, 2774 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.25/self_attn/Concat_4_output_0", "outputIndexes": [ 2775 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2775, 2746 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_3_output_0", "outputIndexes": [ 2776 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2756, 2776 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Add_1_output_0", "outputIndexes": [ 2777 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4557 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3029491510, 2097174, 524288, 0, 0 ] } , "name": "/layers.25/self_attn/v_proj/Linear", "outputIndexes": [ 4566 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4566 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4567 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4567 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2778 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2700, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2779 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2708, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2780 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2779, 2780, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.25/self_attn/Concat_2_output_0", "outputIndexes": [ 2781 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2778, 2781 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/self_attn/Reshape_2_output_0", "outputIndexes": [ 2782 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2748, 2777, 2782, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.25/self_attn/Reshape_7_output_0", "outputIndexes": [ 2783 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2783 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4568 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4568 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4569 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4569 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3032112972, 8388630, 2097152, 0, 0 ] } , "name": "/layers.25/self_attn/o_proj/Linear", "outputIndexes": [ 4570 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4570 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4571 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4571 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2784 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2687, 2784 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/Add_output_0", "outputIndexes": [ 2785 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2785 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3042598754, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.25/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2786 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2786 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4572 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4572 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4573 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4573 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3042631522, 25165846, 6291456, 0, 0 ] } , "name": "/layers.25/mlp/gate_proj/Linear", "outputIndexes": [ 4574 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4574 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4575 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4575 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2787 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2787 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.25/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2788 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4573 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3074088824, 25165846, 6291456, 0, 0 ] } , "name": "/layers.25/mlp/up_proj/Linear", "outputIndexes": [ 4578 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4578 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4579 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4579 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2789 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2788, 2789 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/mlp/Mul_output_0", "outputIndexes": [ 2790 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2790 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4580 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4580 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4581 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4581 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3105546126, 25165846, 6291456, 0, 0 ] } , "name": "/layers.25/mlp/down_proj/Linear", "outputIndexes": [ 4582 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4582 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4583 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4583 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2791 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2785, 2791 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/Add_1_output_0", "outputIndexes": [ 2792 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2792, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/Reshape_output_0", "outputIndexes": [ 2793 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2793 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3137003428, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.26/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2794 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2794 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4584 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4584 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4585 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4585 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3137036196, 8388630, 2097152, 0, 0 ] } , "name": "/layers.26/self_attn/q_proj/Linear", "outputIndexes": [ 4586 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4586 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4587 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4587 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2795 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2794 ] , "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_output_0", "outputIndexes": [ 2796 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2796 ] , "main_type": "NONE", "name": "Shape11027", "outputIndexes": [ 2797 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2796 ] , "main_type": "NONE", "name": "Rank11029", "outputIndexes": [ 2798 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2798, 2798 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11031", "outputIndexes": [ 2799 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2799 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11032", "outputIndexes": [ 2800 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2799, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11034", "outputIndexes": [ 2801 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2801 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11035", "outputIndexes": [ 2802 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2797, 2800, 2802, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11038", "outputIndexes": [ 2803 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2803 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11039", "outputIndexes": [ 2804 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2804, 2804 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11041", "outputIndexes": [ 2805 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2796, 2805, 2799 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_output_0", "outputIndexes": [ 2806 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2806, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2807 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2799 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11049", "outputIndexes": [ 2808 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2801 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11052", "outputIndexes": [ 2809 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2797, 2808, 2809, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11055", "outputIndexes": [ 2810 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2810 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11056", "outputIndexes": [ 2811 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2811 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11057", "outputIndexes": [ 2812 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2812, 2811 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11058", "outputIndexes": [ 2813 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2796, 2813, 2799 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_1_output_0", "outputIndexes": [ 2814 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2814, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2815 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2807, 2815, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.26/self_attn/Concat_output_0", "outputIndexes": [ 2816 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2795, 2816 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/self_attn/Reshape_output_0", "outputIndexes": [ 2817 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2817 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3147521978, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.26/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2819 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11076", "outputIndexes": [ 2820 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11079", "outputIndexes": [ 2821 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2820, 2821, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11082", "outputIndexes": [ 2822 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2822 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11083", "outputIndexes": [ 2823 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2823, 2823 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11085", "outputIndexes": [ 2824 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2824, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_2_output_0", "outputIndexes": [ 2825 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2819, 2825 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_output_0", "outputIndexes": [ 2826 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2819 ] , "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_2_output_0", "outputIndexes": [ 2827 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2827 ] , "main_type": "NONE", "name": "Shape11209", "outputIndexes": [ 2828 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2827 ] , "main_type": "NONE", "name": "Rank11211", "outputIndexes": [ 2829 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2829, 2829 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11213", "outputIndexes": [ 2830 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2830 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11214", "outputIndexes": [ 2831 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2830, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11216", "outputIndexes": [ 2832 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2832 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11217", "outputIndexes": [ 2833 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2828, 2831, 2833, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11220", "outputIndexes": [ 2834 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2834 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11221", "outputIndexes": [ 2835 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2835 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11222", "outputIndexes": [ 2836 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2836, 2835 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11223", "outputIndexes": [ 2837 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2827, 2837, 2830 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_4_output_0", "outputIndexes": [ 2838 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2838, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Div_output_0", "outputIndexes": [ 2839 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2839, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2840 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2819, 2840, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_1_output_0", "outputIndexes": [ 2841 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2841 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.26/self_attn/Neg_output_0", "outputIndexes": [ 2842 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2839, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2843 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2819, 22, 2843, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_output_0", "outputIndexes": [ 2844 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2842, 2844 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.26/self_attn/Concat_3_output_0", "outputIndexes": [ 2845 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11118", "outputIndexes": [ 2846 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11121", "outputIndexes": [ 2847 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2846, 2847, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11124", "outputIndexes": [ 2848 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2848 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11125", "outputIndexes": [ 2849 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2849 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11126", "outputIndexes": [ 2850 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2850, 2849 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11127", "outputIndexes": [ 2851 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2851, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_3_output_0", "outputIndexes": [ 2852 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2845, 2852 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_1_output_0", "outputIndexes": [ 2853 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2826, 2853 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Add_output_0", "outputIndexes": [ 2854 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4585 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3147523002, 2097174, 524288, 0, 0 ] } , "name": "/layers.26/self_attn/k_proj/Linear", "outputIndexes": [ 4590 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4590 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4591 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4591 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2855 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2806, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2856 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2814, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2857 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2856, 2857, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.26/self_attn/Concat_1_output_0", "outputIndexes": [ 2858 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2855, 2858 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/self_attn/Reshape_1_output_0", "outputIndexes": [ 2859 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2859 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3150144464, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.26/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2861 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2861, 2825 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_2_output_0", "outputIndexes": [ 2862 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2861 ] , "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_3_output_0", "outputIndexes": [ 2863 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2863 ] , "main_type": "NONE", "name": "Shape11089", "outputIndexes": [ 2864 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2863 ] , "main_type": "NONE", "name": "Rank11091", "outputIndexes": [ 2865 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2865, 2865 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11093", "outputIndexes": [ 2866 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2866 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11094", "outputIndexes": [ 2867 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2866, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11096", "outputIndexes": [ 2868 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2868 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11097", "outputIndexes": [ 2869 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2864, 2867, 2869, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11100", "outputIndexes": [ 2870 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2870 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11101", "outputIndexes": [ 2871 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2871 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11102", "outputIndexes": [ 2872 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2872, 2871 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11103", "outputIndexes": [ 2873 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2863, 2873, 2866 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_5_output_0", "outputIndexes": [ 2874 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2874, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Div_1_output_0", "outputIndexes": [ 2875 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2875, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2876 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2861, 2876, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_3_output_0", "outputIndexes": [ 2877 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2877 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.26/self_attn/Neg_1_output_0", "outputIndexes": [ 2878 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2875, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2879 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2861, 22, 2879, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_2_output_0", "outputIndexes": [ 2880 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2878, 2880 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.26/self_attn/Concat_4_output_0", "outputIndexes": [ 2881 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2881, 2852 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_3_output_0", "outputIndexes": [ 2882 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2862, 2882 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Add_1_output_0", "outputIndexes": [ 2883 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4585 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3150145488, 2097174, 524288, 0, 0 ] } , "name": "/layers.26/self_attn/v_proj/Linear", "outputIndexes": [ 4594 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4594 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4595 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4595 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2884 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2806, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2885 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2814, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2886 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2885, 2886, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.26/self_attn/Concat_2_output_0", "outputIndexes": [ 2887 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2884, 2887 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/self_attn/Reshape_2_output_0", "outputIndexes": [ 2888 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2854, 2883, 2888, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.26/self_attn/Reshape_7_output_0", "outputIndexes": [ 2889 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2889 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4596 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4596 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4597 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4597 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3152766950, 8388630, 2097152, 0, 0 ] } , "name": "/layers.26/self_attn/o_proj/Linear", "outputIndexes": [ 4598 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4598 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4599 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4599 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2890 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2793, 2890 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/Add_output_0", "outputIndexes": [ 2891 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2891 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3163252732, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.26/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2892 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2892 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4600 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4600 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4601 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4601 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3163285500, 25165846, 6291456, 0, 0 ] } , "name": "/layers.26/mlp/gate_proj/Linear", "outputIndexes": [ 4602 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4602 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4603 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4603 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2893 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2893 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.26/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2894 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4601 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3194742802, 25165846, 6291456, 0, 0 ] } , "name": "/layers.26/mlp/up_proj/Linear", "outputIndexes": [ 4606 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4606 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4607 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4607 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2895 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2894, 2895 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/mlp/Mul_output_0", "outputIndexes": [ 2896 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2896 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4608 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4608 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4609 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4609 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3226200104, 25165846, 6291456, 0, 0 ] } , "name": "/layers.26/mlp/down_proj/Linear", "outputIndexes": [ 4610 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4610 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4611 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4611 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2897 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2891, 2897 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/Add_1_output_0", "outputIndexes": [ 2898 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2898, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/Reshape_output_0", "outputIndexes": [ 2899 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2899 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3257657406, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.27/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2900 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2900 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4612 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4612 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4613 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4613 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3257690174, 8388630, 2097152, 0, 0 ] } , "name": "/layers.27/self_attn/q_proj/Linear", "outputIndexes": [ 4614 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4614 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4615 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4615 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2901 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2900 ] , "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_output_0", "outputIndexes": [ 2902 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2902 ] , "main_type": "NONE", "name": "Shape11448", "outputIndexes": [ 2903 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2902 ] , "main_type": "NONE", "name": "Rank11450", "outputIndexes": [ 2904 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2904, 2904 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11452", "outputIndexes": [ 2905 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2905 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11453", "outputIndexes": [ 2906 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2905, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11455", "outputIndexes": [ 2907 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2907 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11456", "outputIndexes": [ 2908 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2903, 2906, 2908, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11459", "outputIndexes": [ 2909 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2909 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11460", "outputIndexes": [ 2910 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2910, 2910 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11462", "outputIndexes": [ 2911 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2902, 2911, 2905 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_output_0", "outputIndexes": [ 2912 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2912, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2913 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2905 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11470", "outputIndexes": [ 2914 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2907 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11473", "outputIndexes": [ 2915 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2903, 2914, 2915, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11476", "outputIndexes": [ 2916 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2916 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11477", "outputIndexes": [ 2917 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2917 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11478", "outputIndexes": [ 2918 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2918, 2917 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11479", "outputIndexes": [ 2919 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2902, 2919, 2905 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_1_output_0", "outputIndexes": [ 2920 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2920, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2921 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2913, 2921, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.27/self_attn/Concat_output_0", "outputIndexes": [ 2922 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2901, 2922 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/self_attn/Reshape_output_0", "outputIndexes": [ 2923 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2923 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3268175956, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.27/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2925 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11497", "outputIndexes": [ 2926 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11500", "outputIndexes": [ 2927 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2926, 2927, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11503", "outputIndexes": [ 2928 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2928 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11504", "outputIndexes": [ 2929 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2929, 2929 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11506", "outputIndexes": [ 2930 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2930, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_2_output_0", "outputIndexes": [ 2931 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2925, 2931 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_output_0", "outputIndexes": [ 2932 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2925 ] , "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_2_output_0", "outputIndexes": [ 2933 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2933 ] , "main_type": "NONE", "name": "Shape11630", "outputIndexes": [ 2934 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2933 ] , "main_type": "NONE", "name": "Rank11632", "outputIndexes": [ 2935 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2935, 2935 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11634", "outputIndexes": [ 2936 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2936 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11635", "outputIndexes": [ 2937 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2936, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11637", "outputIndexes": [ 2938 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2938 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11638", "outputIndexes": [ 2939 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2934, 2937, 2939, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11641", "outputIndexes": [ 2940 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2940 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11642", "outputIndexes": [ 2941 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2941 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11643", "outputIndexes": [ 2942 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2942, 2941 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11644", "outputIndexes": [ 2943 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2933, 2943, 2936 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_4_output_0", "outputIndexes": [ 2944 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2944, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Div_output_0", "outputIndexes": [ 2945 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2945, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2946 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2925, 2946, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_1_output_0", "outputIndexes": [ 2947 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2947 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.27/self_attn/Neg_output_0", "outputIndexes": [ 2948 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2945, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2949 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2925, 22, 2949, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_output_0", "outputIndexes": [ 2950 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2948, 2950 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.27/self_attn/Concat_3_output_0", "outputIndexes": [ 2951 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11539", "outputIndexes": [ 2952 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11542", "outputIndexes": [ 2953 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 2952, 2953, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11545", "outputIndexes": [ 2954 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2954 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11546", "outputIndexes": [ 2955 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2955 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11547", "outputIndexes": [ 2956 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2956, 2955 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11548", "outputIndexes": [ 2957 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 2957, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_3_output_0", "outputIndexes": [ 2958 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2951, 2958 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_1_output_0", "outputIndexes": [ 2959 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2932, 2959 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Add_output_0", "outputIndexes": [ 2960 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4613 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3268176980, 2097174, 524288, 0, 0 ] } , "name": "/layers.27/self_attn/k_proj/Linear", "outputIndexes": [ 4618 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4618 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4619 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4619 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2961 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2912, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2962 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2920, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2963 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2962, 2963, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.27/self_attn/Concat_1_output_0", "outputIndexes": [ 2964 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2961, 2964 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/self_attn/Reshape_1_output_0", "outputIndexes": [ 2965 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2965 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3270798442, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.27/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2967 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2967, 2931 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_2_output_0", "outputIndexes": [ 2968 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2967 ] , "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_3_output_0", "outputIndexes": [ 2969 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2969 ] , "main_type": "NONE", "name": "Shape11510", "outputIndexes": [ 2970 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2969 ] , "main_type": "NONE", "name": "Rank11512", "outputIndexes": [ 2971 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2971, 2971 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11514", "outputIndexes": [ 2972 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2972 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11515", "outputIndexes": [ 2973 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2972, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11517", "outputIndexes": [ 2974 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2974 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11518", "outputIndexes": [ 2975 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2970, 2973, 2975, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11521", "outputIndexes": [ 2976 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2976 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11522", "outputIndexes": [ 2977 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 2977 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11523", "outputIndexes": [ 2978 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2978, 2977 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11524", "outputIndexes": [ 2979 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2969, 2979, 2972 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_5_output_0", "outputIndexes": [ 2980 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2980, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Div_1_output_0", "outputIndexes": [ 2981 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2981, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2982 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2967, 2982, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_3_output_0", "outputIndexes": [ 2983 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2983 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.27/self_attn/Neg_1_output_0", "outputIndexes": [ 2984 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2981, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2985 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2967, 22, 2985, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_2_output_0", "outputIndexes": [ 2986 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2984, 2986 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.27/self_attn/Concat_4_output_0", "outputIndexes": [ 2987 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2987, 2958 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_3_output_0", "outputIndexes": [ 2988 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2968, 2988 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Add_1_output_0", "outputIndexes": [ 2989 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4613 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3270799466, 2097174, 524288, 0, 0 ] } , "name": "/layers.27/self_attn/v_proj/Linear", "outputIndexes": [ 4622 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4622 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4623 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4623 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2990 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2912, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2991 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2920, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2992 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2991, 2992, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.27/self_attn/Concat_2_output_0", "outputIndexes": [ 2993 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2990, 2993 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/self_attn/Reshape_2_output_0", "outputIndexes": [ 2994 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2960, 2989, 2994, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.27/self_attn/Reshape_7_output_0", "outputIndexes": [ 2995 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2995 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4624 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4624 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4625 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4625 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3273420928, 8388630, 2097152, 0, 0 ] } , "name": "/layers.27/self_attn/o_proj/Linear", "outputIndexes": [ 4626 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4626 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4627 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4627 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2996 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2899, 2996 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/Add_output_0", "outputIndexes": [ 2997 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2997 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3283906710, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.27/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2998 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2998 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4628 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4628 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4629 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4629 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3283939478, 25165846, 6291456, 0, 0 ] } , "name": "/layers.27/mlp/gate_proj/Linear", "outputIndexes": [ 4630 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4630 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4631 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4631 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2999 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2999 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.27/mlp/act_fn/Mul_output_0", "outputIndexes": [ 3000 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4629 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3315396780, 25165846, 6291456, 0, 0 ] } , "name": "/layers.27/mlp/up_proj/Linear", "outputIndexes": [ 4634 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4634 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4635 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4635 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3001 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3000, 3001 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/mlp/Mul_output_0", "outputIndexes": [ 3002 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3002 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4636 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4636 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4637 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4637 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3346854082, 25165846, 6291456, 0, 0 ] } , "name": "/layers.27/mlp/down_proj/Linear", "outputIndexes": [ 4638 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4638 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4639 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4639 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3003 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2997, 3003 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/Add_1_output_0", "outputIndexes": [ 3004 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3004, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.28/Reshape_output_0", "outputIndexes": [ 3005 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3005 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3378311384, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.28/input_layernorm/Mul_1_output_0", "outputIndexes": [ 3006 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3006 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4640 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4640 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4641 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4641 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3378344152, 8388630, 2097152, 0, 0 ] } , "name": "/layers.28/self_attn/q_proj/Linear", "outputIndexes": [ 4642 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4642 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4643 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4643 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 3007 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3006 ] , "main_type": "NONE", "name": "/blocks.28/self_attn/Shape_output_0", "outputIndexes": [ 3008 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3008 ] , "main_type": "NONE", "name": "Shape11869", "outputIndexes": [ 3009 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3008 ] , "main_type": "NONE", "name": "Rank11871", "outputIndexes": [ 3010 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3010, 3010 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11873", "outputIndexes": [ 3011 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3011 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11874", "outputIndexes": [ 3012 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3011, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11876", "outputIndexes": [ 3013 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3013 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11877", "outputIndexes": [ 3014 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3009, 3012, 3014, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11880", "outputIndexes": [ 3015 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3015 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11881", "outputIndexes": [ 3016 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3016, 3016 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11883", "outputIndexes": [ 3017 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3008, 3017, 3011 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_output_0", "outputIndexes": [ 3018 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3018, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_output_0", "outputIndexes": [ 3019 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3011 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11891", "outputIndexes": [ 3020 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3013 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11894", "outputIndexes": [ 3021 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3009, 3020, 3021, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11897", "outputIndexes": [ 3022 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3022 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11898", "outputIndexes": [ 3023 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3023 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11899", "outputIndexes": [ 3024 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3024, 3023 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11900", "outputIndexes": [ 3025 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3008, 3025, 3011 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_1_output_0", "outputIndexes": [ 3026 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3026, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 3027 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3019, 3027, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.28/self_attn/Concat_output_0", "outputIndexes": [ 3028 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3007, 3028 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.28/self_attn/Reshape_output_0", "outputIndexes": [ 3029 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3029 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3388829934, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.28/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 3031 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11918", "outputIndexes": [ 3032 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11921", "outputIndexes": [ 3033 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3032, 3033, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11924", "outputIndexes": [ 3034 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3034 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11925", "outputIndexes": [ 3035 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3035, 3035 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11927", "outputIndexes": [ 3036 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3036, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_2_output_0", "outputIndexes": [ 3037 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3031, 3037 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Mul_output_0", "outputIndexes": [ 3038 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3031 ] , "main_type": "NONE", "name": "/blocks.28/self_attn/Shape_2_output_0", "outputIndexes": [ 3039 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3039 ] , "main_type": "NONE", "name": "Shape12051", "outputIndexes": [ 3040 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3039 ] , "main_type": "NONE", "name": "Rank12053", "outputIndexes": [ 3041 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3041, 3041 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12055", "outputIndexes": [ 3042 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3042 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12056", "outputIndexes": [ 3043 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3042, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12058", "outputIndexes": [ 3044 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3044 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12059", "outputIndexes": [ 3045 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3040, 3043, 3045, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12062", "outputIndexes": [ 3046 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3046 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12063", "outputIndexes": [ 3047 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3047 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12064", "outputIndexes": [ 3048 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3048, 3047 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12065", "outputIndexes": [ 3049 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3039, 3049, 3042 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_4_output_0", "outputIndexes": [ 3050 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3050, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Div_output_0", "outputIndexes": [ 3051 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3051, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 3052 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3031, 3052, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.28/self_attn/Slice_1_output_0", "outputIndexes": [ 3053 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3053 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.28/self_attn/Neg_output_0", "outputIndexes": [ 3054 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3051, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 3055 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3031, 22, 3055, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.28/self_attn/Slice_output_0", "outputIndexes": [ 3056 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3054, 3056 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.28/self_attn/Concat_3_output_0", "outputIndexes": [ 3057 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11960", "outputIndexes": [ 3058 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11963", "outputIndexes": [ 3059 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3058, 3059, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11966", "outputIndexes": [ 3060 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3060 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11967", "outputIndexes": [ 3061 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3061 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11968", "outputIndexes": [ 3062 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3062, 3061 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11969", "outputIndexes": [ 3063 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3063, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_3_output_0", "outputIndexes": [ 3064 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3057, 3064 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Mul_1_output_0", "outputIndexes": [ 3065 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3038, 3065 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Add_output_0", "outputIndexes": [ 3066 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4641 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3388830958, 2097174, 524288, 0, 0 ] } , "name": "/layers.28/self_attn/k_proj/Linear", "outputIndexes": [ 4646 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4646 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4647 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4647 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 3067 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3018, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 3068 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3026, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 3069 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3068, 3069, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.28/self_attn/Concat_1_output_0", "outputIndexes": [ 3070 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3067, 3070 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.28/self_attn/Reshape_1_output_0", "outputIndexes": [ 3071 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3071 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3391452420, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.28/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 3073 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3073, 3037 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Mul_2_output_0", "outputIndexes": [ 3074 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3073 ] , "main_type": "NONE", "name": "/blocks.28/self_attn/Shape_3_output_0", "outputIndexes": [ 3075 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3075 ] , "main_type": "NONE", "name": "Shape11931", "outputIndexes": [ 3076 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3075 ] , "main_type": "NONE", "name": "Rank11933", "outputIndexes": [ 3077 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3077, 3077 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11935", "outputIndexes": [ 3078 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3078 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11936", "outputIndexes": [ 3079 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3078, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11938", "outputIndexes": [ 3080 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3080 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11939", "outputIndexes": [ 3081 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3076, 3079, 3081, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11942", "outputIndexes": [ 3082 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3082 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11943", "outputIndexes": [ 3083 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3083 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11944", "outputIndexes": [ 3084 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3084, 3083 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11945", "outputIndexes": [ 3085 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3075, 3085, 3078 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_5_output_0", "outputIndexes": [ 3086 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3086, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Div_1_output_0", "outputIndexes": [ 3087 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3087, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 3088 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3073, 3088, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.28/self_attn/Slice_3_output_0", "outputIndexes": [ 3089 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3089 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.28/self_attn/Neg_1_output_0", "outputIndexes": [ 3090 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3087, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 3091 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3073, 22, 3091, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.28/self_attn/Slice_2_output_0", "outputIndexes": [ 3092 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3090, 3092 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.28/self_attn/Concat_4_output_0", "outputIndexes": [ 3093 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3093, 3064 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Mul_3_output_0", "outputIndexes": [ 3094 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3074, 3094 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Add_1_output_0", "outputIndexes": [ 3095 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4641 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3391453444, 2097174, 524288, 0, 0 ] } , "name": "/layers.28/self_attn/v_proj/Linear", "outputIndexes": [ 4650 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4650 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4651 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4651 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 3096 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3018, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 3097 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3026, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 3098 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3097, 3098, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.28/self_attn/Concat_2_output_0", "outputIndexes": [ 3099 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3096, 3099 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.28/self_attn/Reshape_2_output_0", "outputIndexes": [ 3100 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3066, 3095, 3100, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.28/self_attn/Reshape_7_output_0", "outputIndexes": [ 3101 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3101 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4652 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4652 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4653 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4653 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3394074906, 8388630, 2097152, 0, 0 ] } , "name": "/layers.28/self_attn/o_proj/Linear", "outputIndexes": [ 4654 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4654 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4655 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4655 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 3102 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3005, 3102 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/Add_output_0", "outputIndexes": [ 3103 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3103 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3404560688, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.28/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 3104 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3104 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4656 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4656 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4657 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4657 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3404593456, 25165846, 6291456, 0, 0 ] } , "name": "/layers.28/mlp/gate_proj/Linear", "outputIndexes": [ 4658 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4658 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4659 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4659 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 3105 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3105 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.28/mlp/act_fn/Mul_output_0", "outputIndexes": [ 3106 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4657 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3436050758, 25165846, 6291456, 0, 0 ] } , "name": "/layers.28/mlp/up_proj/Linear", "outputIndexes": [ 4662 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4662 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4663 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4663 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3107 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3106, 3107 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/mlp/Mul_output_0", "outputIndexes": [ 3108 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3108 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4664 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4664 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4665 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4665 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3467508060, 25165846, 6291456, 0, 0 ] } , "name": "/layers.28/mlp/down_proj/Linear", "outputIndexes": [ 4666 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4666 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4667 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4667 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3109 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3103, 3109 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/Add_1_output_0", "outputIndexes": [ 3110 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3110, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.29/Reshape_output_0", "outputIndexes": [ 3111 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3111 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3498965362, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.29/input_layernorm/Mul_1_output_0", "outputIndexes": [ 3112 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3112 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4668 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4668 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4669 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4669 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3498998130, 8388630, 2097152, 0, 0 ] } , "name": "/layers.29/self_attn/q_proj/Linear", "outputIndexes": [ 4670 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4670 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4671 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4671 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 3113 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3112 ] , "main_type": "NONE", "name": "/blocks.29/self_attn/Shape_output_0", "outputIndexes": [ 3114 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3114 ] , "main_type": "NONE", "name": "Shape12290", "outputIndexes": [ 3115 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3114 ] , "main_type": "NONE", "name": "Rank12292", "outputIndexes": [ 3116 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3116, 3116 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12294", "outputIndexes": [ 3117 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3117 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12295", "outputIndexes": [ 3118 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3117, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12297", "outputIndexes": [ 3119 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3119 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12298", "outputIndexes": [ 3120 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3115, 3118, 3120, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12301", "outputIndexes": [ 3121 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3121 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12302", "outputIndexes": [ 3122 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3122, 3122 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12304", "outputIndexes": [ 3123 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3114, 3123, 3117 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_output_0", "outputIndexes": [ 3124 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3124, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_output_0", "outputIndexes": [ 3125 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3117 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12312", "outputIndexes": [ 3126 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3119 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12315", "outputIndexes": [ 3127 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3115, 3126, 3127, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12318", "outputIndexes": [ 3128 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3128 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12319", "outputIndexes": [ 3129 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3129 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12320", "outputIndexes": [ 3130 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3130, 3129 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12321", "outputIndexes": [ 3131 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3114, 3131, 3117 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_1_output_0", "outputIndexes": [ 3132 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3132, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 3133 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3125, 3133, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.29/self_attn/Concat_output_0", "outputIndexes": [ 3134 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3113, 3134 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.29/self_attn/Reshape_output_0", "outputIndexes": [ 3135 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3135 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3509483912, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.29/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 3137 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12339", "outputIndexes": [ 3138 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12342", "outputIndexes": [ 3139 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3138, 3139, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12345", "outputIndexes": [ 3140 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3140 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12346", "outputIndexes": [ 3141 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3141, 3141 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12348", "outputIndexes": [ 3142 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3142, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_2_output_0", "outputIndexes": [ 3143 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3137, 3143 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Mul_output_0", "outputIndexes": [ 3144 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3137 ] , "main_type": "NONE", "name": "/blocks.29/self_attn/Shape_2_output_0", "outputIndexes": [ 3145 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3145 ] , "main_type": "NONE", "name": "Shape12472", "outputIndexes": [ 3146 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3145 ] , "main_type": "NONE", "name": "Rank12474", "outputIndexes": [ 3147 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3147, 3147 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12476", "outputIndexes": [ 3148 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3148 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12477", "outputIndexes": [ 3149 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3148, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12479", "outputIndexes": [ 3150 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3150 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12480", "outputIndexes": [ 3151 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3146, 3149, 3151, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12483", "outputIndexes": [ 3152 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3152 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12484", "outputIndexes": [ 3153 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3153 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12485", "outputIndexes": [ 3154 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3154, 3153 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12486", "outputIndexes": [ 3155 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3145, 3155, 3148 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_4_output_0", "outputIndexes": [ 3156 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3156, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Div_output_0", "outputIndexes": [ 3157 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3157, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 3158 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3137, 3158, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.29/self_attn/Slice_1_output_0", "outputIndexes": [ 3159 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3159 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.29/self_attn/Neg_output_0", "outputIndexes": [ 3160 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3157, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 3161 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3137, 22, 3161, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.29/self_attn/Slice_output_0", "outputIndexes": [ 3162 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3160, 3162 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.29/self_attn/Concat_3_output_0", "outputIndexes": [ 3163 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12381", "outputIndexes": [ 3164 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12384", "outputIndexes": [ 3165 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3164, 3165, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12387", "outputIndexes": [ 3166 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3166 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12388", "outputIndexes": [ 3167 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3167 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12389", "outputIndexes": [ 3168 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3168, 3167 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12390", "outputIndexes": [ 3169 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3169, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_3_output_0", "outputIndexes": [ 3170 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3163, 3170 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Mul_1_output_0", "outputIndexes": [ 3171 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3144, 3171 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Add_output_0", "outputIndexes": [ 3172 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4669 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3509484936, 2097174, 524288, 0, 0 ] } , "name": "/layers.29/self_attn/k_proj/Linear", "outputIndexes": [ 4674 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4674 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4675 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4675 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 3173 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3124, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 3174 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3132, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 3175 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3174, 3175, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.29/self_attn/Concat_1_output_0", "outputIndexes": [ 3176 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3173, 3176 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.29/self_attn/Reshape_1_output_0", "outputIndexes": [ 3177 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3177 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3512106398, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.29/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 3179 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3179, 3143 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Mul_2_output_0", "outputIndexes": [ 3180 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3179 ] , "main_type": "NONE", "name": "/blocks.29/self_attn/Shape_3_output_0", "outputIndexes": [ 3181 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3181 ] , "main_type": "NONE", "name": "Shape12352", "outputIndexes": [ 3182 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3181 ] , "main_type": "NONE", "name": "Rank12354", "outputIndexes": [ 3183 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3183, 3183 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12356", "outputIndexes": [ 3184 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3184 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12357", "outputIndexes": [ 3185 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3184, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12359", "outputIndexes": [ 3186 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3186 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12360", "outputIndexes": [ 3187 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3182, 3185, 3187, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12363", "outputIndexes": [ 3188 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3188 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12364", "outputIndexes": [ 3189 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3189 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12365", "outputIndexes": [ 3190 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3190, 3189 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12366", "outputIndexes": [ 3191 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3181, 3191, 3184 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_5_output_0", "outputIndexes": [ 3192 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3192, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Div_1_output_0", "outputIndexes": [ 3193 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3193, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 3194 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3179, 3194, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.29/self_attn/Slice_3_output_0", "outputIndexes": [ 3195 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3195 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.29/self_attn/Neg_1_output_0", "outputIndexes": [ 3196 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3193, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 3197 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3179, 22, 3197, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.29/self_attn/Slice_2_output_0", "outputIndexes": [ 3198 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3196, 3198 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.29/self_attn/Concat_4_output_0", "outputIndexes": [ 3199 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3199, 3170 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Mul_3_output_0", "outputIndexes": [ 3200 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3180, 3200 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Add_1_output_0", "outputIndexes": [ 3201 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4669 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3512107422, 2097174, 524288, 0, 0 ] } , "name": "/layers.29/self_attn/v_proj/Linear", "outputIndexes": [ 4678 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4678 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4679 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4679 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 3202 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3124, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 3203 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3132, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 3204 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3203, 3204, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.29/self_attn/Concat_2_output_0", "outputIndexes": [ 3205 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3202, 3205 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.29/self_attn/Reshape_2_output_0", "outputIndexes": [ 3206 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3172, 3201, 3206, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.29/self_attn/Reshape_7_output_0", "outputIndexes": [ 3207 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3207 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4680 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4680 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4681 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4681 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3514728884, 8388630, 2097152, 0, 0 ] } , "name": "/layers.29/self_attn/o_proj/Linear", "outputIndexes": [ 4682 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4682 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4683 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4683 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 3208 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3111, 3208 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/Add_output_0", "outputIndexes": [ 3209 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3209 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3525214666, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.29/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 3210 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3210 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4684 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4684 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4685 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4685 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3525247434, 25165846, 6291456, 0, 0 ] } , "name": "/layers.29/mlp/gate_proj/Linear", "outputIndexes": [ 4686 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4686 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4687 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4687 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 3211 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3211 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.29/mlp/act_fn/Mul_output_0", "outputIndexes": [ 3212 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4685 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3556704736, 25165846, 6291456, 0, 0 ] } , "name": "/layers.29/mlp/up_proj/Linear", "outputIndexes": [ 4690 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4690 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4691 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4691 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3213 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3212, 3213 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/mlp/Mul_output_0", "outputIndexes": [ 3214 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3214 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4692 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4692 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4693 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4693 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3588162038, 25165846, 6291456, 0, 0 ] } , "name": "/layers.29/mlp/down_proj/Linear", "outputIndexes": [ 4694 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4694 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4695 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4695 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3215 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3209, 3215 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/Add_1_output_0", "outputIndexes": [ 3216 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3216, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.30/Reshape_output_0", "outputIndexes": [ 3217 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3217 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3619619340, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.30/input_layernorm/Mul_1_output_0", "outputIndexes": [ 3218 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3218 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4696 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4696 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4697 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4697 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3619652108, 8388630, 2097152, 0, 0 ] } , "name": "/layers.30/self_attn/q_proj/Linear", "outputIndexes": [ 4698 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4698 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4699 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4699 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 3219 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3218 ] , "main_type": "NONE", "name": "/blocks.30/self_attn/Shape_output_0", "outputIndexes": [ 3220 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3220 ] , "main_type": "NONE", "name": "Shape12711", "outputIndexes": [ 3221 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3220 ] , "main_type": "NONE", "name": "Rank12713", "outputIndexes": [ 3222 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3222, 3222 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12715", "outputIndexes": [ 3223 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3223 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12716", "outputIndexes": [ 3224 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3223, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12718", "outputIndexes": [ 3225 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3225 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12719", "outputIndexes": [ 3226 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3221, 3224, 3226, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12722", "outputIndexes": [ 3227 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3227 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12723", "outputIndexes": [ 3228 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3228, 3228 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12725", "outputIndexes": [ 3229 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3220, 3229, 3223 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_output_0", "outputIndexes": [ 3230 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3230, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_output_0", "outputIndexes": [ 3231 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3223 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12733", "outputIndexes": [ 3232 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3225 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12736", "outputIndexes": [ 3233 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3221, 3232, 3233, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12739", "outputIndexes": [ 3234 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3234 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12740", "outputIndexes": [ 3235 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3235 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12741", "outputIndexes": [ 3236 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3236, 3235 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12742", "outputIndexes": [ 3237 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3220, 3237, 3223 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_1_output_0", "outputIndexes": [ 3238 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3238, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 3239 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3231, 3239, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.30/self_attn/Concat_output_0", "outputIndexes": [ 3240 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3219, 3240 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.30/self_attn/Reshape_output_0", "outputIndexes": [ 3241 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3241 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3630137890, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.30/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 3243 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12760", "outputIndexes": [ 3244 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12763", "outputIndexes": [ 3245 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3244, 3245, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12766", "outputIndexes": [ 3246 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3246 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12767", "outputIndexes": [ 3247 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3247, 3247 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12769", "outputIndexes": [ 3248 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3248, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_2_output_0", "outputIndexes": [ 3249 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3243, 3249 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Mul_output_0", "outputIndexes": [ 3250 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3243 ] , "main_type": "NONE", "name": "/blocks.30/self_attn/Shape_2_output_0", "outputIndexes": [ 3251 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3251 ] , "main_type": "NONE", "name": "Shape12893", "outputIndexes": [ 3252 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3251 ] , "main_type": "NONE", "name": "Rank12895", "outputIndexes": [ 3253 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3253, 3253 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12897", "outputIndexes": [ 3254 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3254 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12898", "outputIndexes": [ 3255 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3254, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12900", "outputIndexes": [ 3256 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3256 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12901", "outputIndexes": [ 3257 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3252, 3255, 3257, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12904", "outputIndexes": [ 3258 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3258 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12905", "outputIndexes": [ 3259 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3259 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12906", "outputIndexes": [ 3260 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3260, 3259 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12907", "outputIndexes": [ 3261 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3251, 3261, 3254 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_4_output_0", "outputIndexes": [ 3262 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3262, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Div_output_0", "outputIndexes": [ 3263 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3263, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 3264 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3243, 3264, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.30/self_attn/Slice_1_output_0", "outputIndexes": [ 3265 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3265 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.30/self_attn/Neg_output_0", "outputIndexes": [ 3266 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3263, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 3267 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3243, 22, 3267, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.30/self_attn/Slice_output_0", "outputIndexes": [ 3268 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3266, 3268 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.30/self_attn/Concat_3_output_0", "outputIndexes": [ 3269 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12802", "outputIndexes": [ 3270 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12805", "outputIndexes": [ 3271 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3270, 3271, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12808", "outputIndexes": [ 3272 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3272 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12809", "outputIndexes": [ 3273 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3273 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12810", "outputIndexes": [ 3274 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3274, 3273 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12811", "outputIndexes": [ 3275 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3275, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_3_output_0", "outputIndexes": [ 3276 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3269, 3276 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Mul_1_output_0", "outputIndexes": [ 3277 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3250, 3277 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Add_output_0", "outputIndexes": [ 3278 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4697 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3630138914, 2097174, 524288, 0, 0 ] } , "name": "/layers.30/self_attn/k_proj/Linear", "outputIndexes": [ 4702 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4702 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4703 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4703 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 3279 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3230, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 3280 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3238, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 3281 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3280, 3281, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.30/self_attn/Concat_1_output_0", "outputIndexes": [ 3282 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3279, 3282 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.30/self_attn/Reshape_1_output_0", "outputIndexes": [ 3283 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3283 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3632760376, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.30/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 3285 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3285, 3249 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Mul_2_output_0", "outputIndexes": [ 3286 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3285 ] , "main_type": "NONE", "name": "/blocks.30/self_attn/Shape_3_output_0", "outputIndexes": [ 3287 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3287 ] , "main_type": "NONE", "name": "Shape12773", "outputIndexes": [ 3288 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3287 ] , "main_type": "NONE", "name": "Rank12775", "outputIndexes": [ 3289 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3289, 3289 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12777", "outputIndexes": [ 3290 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3290 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12778", "outputIndexes": [ 3291 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3290, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12780", "outputIndexes": [ 3292 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3292 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12781", "outputIndexes": [ 3293 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3288, 3291, 3293, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12784", "outputIndexes": [ 3294 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3294 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12785", "outputIndexes": [ 3295 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3295 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12786", "outputIndexes": [ 3296 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3296, 3295 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12787", "outputIndexes": [ 3297 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3287, 3297, 3290 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_5_output_0", "outputIndexes": [ 3298 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3298, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Div_1_output_0", "outputIndexes": [ 3299 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3299, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 3300 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3285, 3300, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.30/self_attn/Slice_3_output_0", "outputIndexes": [ 3301 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3301 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.30/self_attn/Neg_1_output_0", "outputIndexes": [ 3302 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3299, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 3303 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3285, 22, 3303, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.30/self_attn/Slice_2_output_0", "outputIndexes": [ 3304 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3302, 3304 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.30/self_attn/Concat_4_output_0", "outputIndexes": [ 3305 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3305, 3276 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Mul_3_output_0", "outputIndexes": [ 3306 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3286, 3306 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Add_1_output_0", "outputIndexes": [ 3307 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4697 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3632761400, 2097174, 524288, 0, 0 ] } , "name": "/layers.30/self_attn/v_proj/Linear", "outputIndexes": [ 4706 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4706 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4707 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4707 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 3308 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3230, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 3309 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3238, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 3310 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3309, 3310, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.30/self_attn/Concat_2_output_0", "outputIndexes": [ 3311 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3308, 3311 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.30/self_attn/Reshape_2_output_0", "outputIndexes": [ 3312 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3278, 3307, 3312, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.30/self_attn/Reshape_7_output_0", "outputIndexes": [ 3313 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3313 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4708 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4708 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4709 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4709 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3635382862, 8388630, 2097152, 0, 0 ] } , "name": "/layers.30/self_attn/o_proj/Linear", "outputIndexes": [ 4710 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4710 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4711 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4711 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 3314 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3217, 3314 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/Add_output_0", "outputIndexes": [ 3315 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3315 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3645868644, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.30/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 3316 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3316 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4712 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4712 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4713 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4713 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3645901412, 25165846, 6291456, 0, 0 ] } , "name": "/layers.30/mlp/gate_proj/Linear", "outputIndexes": [ 4714 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4714 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4715 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4715 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 3317 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3317 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.30/mlp/act_fn/Mul_output_0", "outputIndexes": [ 3318 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4713 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3677358714, 25165846, 6291456, 0, 0 ] } , "name": "/layers.30/mlp/up_proj/Linear", "outputIndexes": [ 4718 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4718 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4719 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4719 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3319 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3318, 3319 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/mlp/Mul_output_0", "outputIndexes": [ 3320 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3320 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4720 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4720 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4721 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4721 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3708816016, 25165846, 6291456, 0, 0 ] } , "name": "/layers.30/mlp/down_proj/Linear", "outputIndexes": [ 4722 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4722 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4723 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4723 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3321 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3315, 3321 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/Add_1_output_0", "outputIndexes": [ 3322 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3322, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.31/Reshape_output_0", "outputIndexes": [ 3323 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3323 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3740273318, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.31/input_layernorm/Mul_1_output_0", "outputIndexes": [ 3324 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3324 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4724 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4724 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4725 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4725 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3740306086, 8388630, 2097152, 0, 0 ] } , "name": "/layers.31/self_attn/q_proj/Linear", "outputIndexes": [ 4726 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4726 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4727 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4727 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 3325 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3324 ] , "main_type": "NONE", "name": "/blocks.31/self_attn/Shape_output_0", "outputIndexes": [ 3326 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3326 ] , "main_type": "NONE", "name": "Shape13132", "outputIndexes": [ 3327 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3326 ] , "main_type": "NONE", "name": "Rank13134", "outputIndexes": [ 3328 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3328, 3328 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13136", "outputIndexes": [ 3329 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3329 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13137", "outputIndexes": [ 3330 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3329, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13139", "outputIndexes": [ 3331 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3331 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13140", "outputIndexes": [ 3332 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3327, 3330, 3332, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13143", "outputIndexes": [ 3333 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3333 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13144", "outputIndexes": [ 3334 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3334, 3334 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13146", "outputIndexes": [ 3335 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3326, 3335, 3329 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_output_0", "outputIndexes": [ 3336 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3336, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_output_0", "outputIndexes": [ 3337 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3329 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13154", "outputIndexes": [ 3338 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3331 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13157", "outputIndexes": [ 3339 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3327, 3338, 3339, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13160", "outputIndexes": [ 3340 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3340 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13161", "outputIndexes": [ 3341 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3341 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13162", "outputIndexes": [ 3342 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3342, 3341 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13163", "outputIndexes": [ 3343 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3326, 3343, 3329 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_1_output_0", "outputIndexes": [ 3344 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3344, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 3345 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3337, 3345, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.31/self_attn/Concat_output_0", "outputIndexes": [ 3346 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3325, 3346 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.31/self_attn/Reshape_output_0", "outputIndexes": [ 3347 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3347 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3750791868, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.31/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 3349 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13181", "outputIndexes": [ 3350 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13184", "outputIndexes": [ 3351 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3350, 3351, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13187", "outputIndexes": [ 3352 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3352 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13188", "outputIndexes": [ 3353 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3353, 3353 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13190", "outputIndexes": [ 3354 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3354, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_2_output_0", "outputIndexes": [ 3355 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3349, 3355 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Mul_output_0", "outputIndexes": [ 3356 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3349 ] , "main_type": "NONE", "name": "/blocks.31/self_attn/Shape_2_output_0", "outputIndexes": [ 3357 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3357 ] , "main_type": "NONE", "name": "Shape13314", "outputIndexes": [ 3358 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3357 ] , "main_type": "NONE", "name": "Rank13316", "outputIndexes": [ 3359 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3359, 3359 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13318", "outputIndexes": [ 3360 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3360 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13319", "outputIndexes": [ 3361 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3360, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13321", "outputIndexes": [ 3362 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3362 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13322", "outputIndexes": [ 3363 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3358, 3361, 3363, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13325", "outputIndexes": [ 3364 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3364 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13326", "outputIndexes": [ 3365 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3365 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13327", "outputIndexes": [ 3366 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3366, 3365 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13328", "outputIndexes": [ 3367 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3357, 3367, 3360 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_4_output_0", "outputIndexes": [ 3368 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3368, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Div_output_0", "outputIndexes": [ 3369 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3369, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 3370 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3349, 3370, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.31/self_attn/Slice_1_output_0", "outputIndexes": [ 3371 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3371 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.31/self_attn/Neg_output_0", "outputIndexes": [ 3372 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3369, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 3373 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3349, 22, 3373, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.31/self_attn/Slice_output_0", "outputIndexes": [ 3374 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3372, 3374 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.31/self_attn/Concat_3_output_0", "outputIndexes": [ 3375 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13223", "outputIndexes": [ 3376 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13226", "outputIndexes": [ 3377 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3376, 3377, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13229", "outputIndexes": [ 3378 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3378 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13230", "outputIndexes": [ 3379 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3379 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13231", "outputIndexes": [ 3380 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3380, 3379 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13232", "outputIndexes": [ 3381 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3381, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_3_output_0", "outputIndexes": [ 3382 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3375, 3382 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Mul_1_output_0", "outputIndexes": [ 3383 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3356, 3383 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Add_output_0", "outputIndexes": [ 3384 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4725 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3750792892, 2097174, 524288, 0, 0 ] } , "name": "/layers.31/self_attn/k_proj/Linear", "outputIndexes": [ 4730 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4730 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4731 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4731 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 3385 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3336, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 3386 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3344, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 3387 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3386, 3387, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.31/self_attn/Concat_1_output_0", "outputIndexes": [ 3388 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3385, 3388 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.31/self_attn/Reshape_1_output_0", "outputIndexes": [ 3389 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3389 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3753414354, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.31/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 3391 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3391, 3355 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Mul_2_output_0", "outputIndexes": [ 3392 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3391 ] , "main_type": "NONE", "name": "/blocks.31/self_attn/Shape_3_output_0", "outputIndexes": [ 3393 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3393 ] , "main_type": "NONE", "name": "Shape13194", "outputIndexes": [ 3394 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3393 ] , "main_type": "NONE", "name": "Rank13196", "outputIndexes": [ 3395 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3395, 3395 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13198", "outputIndexes": [ 3396 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3396 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13199", "outputIndexes": [ 3397 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3396, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13201", "outputIndexes": [ 3398 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3398 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13202", "outputIndexes": [ 3399 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3394, 3397, 3399, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13205", "outputIndexes": [ 3400 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3400 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13206", "outputIndexes": [ 3401 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3401 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13207", "outputIndexes": [ 3402 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3402, 3401 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13208", "outputIndexes": [ 3403 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3393, 3403, 3396 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_5_output_0", "outputIndexes": [ 3404 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3404, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Div_1_output_0", "outputIndexes": [ 3405 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3405, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 3406 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3391, 3406, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.31/self_attn/Slice_3_output_0", "outputIndexes": [ 3407 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3407 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.31/self_attn/Neg_1_output_0", "outputIndexes": [ 3408 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3405, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 3409 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3391, 22, 3409, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.31/self_attn/Slice_2_output_0", "outputIndexes": [ 3410 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3408, 3410 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.31/self_attn/Concat_4_output_0", "outputIndexes": [ 3411 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3411, 3382 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Mul_3_output_0", "outputIndexes": [ 3412 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3392, 3412 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Add_1_output_0", "outputIndexes": [ 3413 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4725 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3753415378, 2097174, 524288, 0, 0 ] } , "name": "/layers.31/self_attn/v_proj/Linear", "outputIndexes": [ 4734 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4734 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4735 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4735 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 3414 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3336, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 3415 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3344, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 3416 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3415, 3416, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.31/self_attn/Concat_2_output_0", "outputIndexes": [ 3417 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3414, 3417 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.31/self_attn/Reshape_2_output_0", "outputIndexes": [ 3418 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3384, 3413, 3418, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.31/self_attn/Reshape_7_output_0", "outputIndexes": [ 3419 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3419 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4736 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4736 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4737 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4737 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3756036840, 8388630, 2097152, 0, 0 ] } , "name": "/layers.31/self_attn/o_proj/Linear", "outputIndexes": [ 4738 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4738 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4739 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4739 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 3420 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3323, 3420 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/Add_output_0", "outputIndexes": [ 3421 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3421 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3766522622, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.31/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 3422 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3422 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4740 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4740 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4741 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4741 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3766555390, 25165846, 6291456, 0, 0 ] } , "name": "/layers.31/mlp/gate_proj/Linear", "outputIndexes": [ 4742 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4742 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4743 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4743 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 3423 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3423 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.31/mlp/act_fn/Mul_output_0", "outputIndexes": [ 3424 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4741 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3798012692, 25165846, 6291456, 0, 0 ] } , "name": "/layers.31/mlp/up_proj/Linear", "outputIndexes": [ 4746 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4746 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4747 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4747 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3425 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3424, 3425 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/mlp/Mul_output_0", "outputIndexes": [ 3426 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3426 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4748 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4748 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4749 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4749 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3829469994, 25165846, 6291456, 0, 0 ] } , "name": "/layers.31/mlp/down_proj/Linear", "outputIndexes": [ 4750 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4750 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4751 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4751 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3427 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3421, 3427 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/Add_1_output_0", "outputIndexes": [ 3428 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3428, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.32/Reshape_output_0", "outputIndexes": [ 3429 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3429 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3860927296, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.32/input_layernorm/Mul_1_output_0", "outputIndexes": [ 3430 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3430 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.32/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4752 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4752 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.32/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4753 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4753 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3860960064, 8388630, 2097152, 0, 0 ] } , "name": "/layers.32/self_attn/q_proj/Linear", "outputIndexes": [ 4754 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4754 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4755 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4755 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.32/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 3431 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3430 ] , "main_type": "NONE", "name": "/blocks.32/self_attn/Shape_output_0", "outputIndexes": [ 3432 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3432 ] , "main_type": "NONE", "name": "Shape13553", "outputIndexes": [ 3433 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3432 ] , "main_type": "NONE", "name": "Rank13555", "outputIndexes": [ 3434 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3434, 3434 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13557", "outputIndexes": [ 3435 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3435 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13558", "outputIndexes": [ 3436 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3435, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13560", "outputIndexes": [ 3437 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3437 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13561", "outputIndexes": [ 3438 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3433, 3436, 3438, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13564", "outputIndexes": [ 3439 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3439 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13565", "outputIndexes": [ 3440 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3440, 3440 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13567", "outputIndexes": [ 3441 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3432, 3441, 3435 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.32/self_attn/Gather_output_0", "outputIndexes": [ 3442 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3442, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.32/self_attn/Unsqueeze_output_0", "outputIndexes": [ 3443 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3435 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13575", "outputIndexes": [ 3444 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3437 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13578", "outputIndexes": [ 3445 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3433, 3444, 3445, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13581", "outputIndexes": [ 3446 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3446 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13582", "outputIndexes": [ 3447 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3447 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13583", "outputIndexes": [ 3448 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3448, 3447 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13584", "outputIndexes": [ 3449 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3432, 3449, 3435 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.32/self_attn/Gather_1_output_0", "outputIndexes": [ 3450 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3450, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.32/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 3451 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3443, 3451, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.32/self_attn/Concat_output_0", "outputIndexes": [ 3452 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3431, 3452 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.32/self_attn/Reshape_output_0", "outputIndexes": [ 3453 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3453 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3871445846, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.32/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 3455 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13602", "outputIndexes": [ 3456 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13605", "outputIndexes": [ 3457 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3456, 3457, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13608", "outputIndexes": [ 3458 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3458 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13609", "outputIndexes": [ 3459 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3459, 3459 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13611", "outputIndexes": [ 3460 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3460, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.32/self_attn/Gather_2_output_0", "outputIndexes": [ 3461 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3455, 3461 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.32/self_attn/Mul_output_0", "outputIndexes": [ 3462 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3455 ] , "main_type": "NONE", "name": "/blocks.32/self_attn/Shape_2_output_0", "outputIndexes": [ 3463 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3463 ] , "main_type": "NONE", "name": "Shape13735", "outputIndexes": [ 3464 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3463 ] , "main_type": "NONE", "name": "Rank13737", "outputIndexes": [ 3465 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3465, 3465 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13739", "outputIndexes": [ 3466 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3466 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13740", "outputIndexes": [ 3467 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3466, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13742", "outputIndexes": [ 3468 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3468 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13743", "outputIndexes": [ 3469 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3464, 3467, 3469, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13746", "outputIndexes": [ 3470 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3470 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13747", "outputIndexes": [ 3471 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3471 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13748", "outputIndexes": [ 3472 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3472, 3471 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13749", "outputIndexes": [ 3473 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3463, 3473, 3466 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.32/self_attn/Gather_4_output_0", "outputIndexes": [ 3474 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3474, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.32/self_attn/Div_output_0", "outputIndexes": [ 3475 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3475, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.32/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 3476 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3455, 3476, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.32/self_attn/Slice_1_output_0", "outputIndexes": [ 3477 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3477 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.32/self_attn/Neg_output_0", "outputIndexes": [ 3478 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3475, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.32/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 3479 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3455, 22, 3479, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.32/self_attn/Slice_output_0", "outputIndexes": [ 3480 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3478, 3480 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.32/self_attn/Concat_3_output_0", "outputIndexes": [ 3481 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13644", "outputIndexes": [ 3482 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13647", "outputIndexes": [ 3483 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3482, 3483, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13650", "outputIndexes": [ 3484 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3484 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13651", "outputIndexes": [ 3485 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3485 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13652", "outputIndexes": [ 3486 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3486, 3485 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13653", "outputIndexes": [ 3487 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3487, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.32/self_attn/Gather_3_output_0", "outputIndexes": [ 3488 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3481, 3488 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.32/self_attn/Mul_1_output_0", "outputIndexes": [ 3489 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3462, 3489 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.32/self_attn/Add_output_0", "outputIndexes": [ 3490 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4753 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3871446870, 2097174, 524288, 0, 0 ] } , "name": "/layers.32/self_attn/k_proj/Linear", "outputIndexes": [ 4758 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4758 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4759 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4759 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.32/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 3491 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3442, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.32/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 3492 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3450, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.32/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 3493 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3492, 3493, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.32/self_attn/Concat_1_output_0", "outputIndexes": [ 3494 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3491, 3494 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.32/self_attn/Reshape_1_output_0", "outputIndexes": [ 3495 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3495 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3874068332, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.32/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 3497 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3497, 3461 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.32/self_attn/Mul_2_output_0", "outputIndexes": [ 3498 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3497 ] , "main_type": "NONE", "name": "/blocks.32/self_attn/Shape_3_output_0", "outputIndexes": [ 3499 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3499 ] , "main_type": "NONE", "name": "Shape13615", "outputIndexes": [ 3500 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3499 ] , "main_type": "NONE", "name": "Rank13617", "outputIndexes": [ 3501 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3501, 3501 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13619", "outputIndexes": [ 3502 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3502 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13620", "outputIndexes": [ 3503 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3502, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13622", "outputIndexes": [ 3504 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3504 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13623", "outputIndexes": [ 3505 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3500, 3503, 3505, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13626", "outputIndexes": [ 3506 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3506 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13627", "outputIndexes": [ 3507 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3507 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13628", "outputIndexes": [ 3508 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3508, 3507 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13629", "outputIndexes": [ 3509 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3499, 3509, 3502 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.32/self_attn/Gather_5_output_0", "outputIndexes": [ 3510 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3510, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.32/self_attn/Div_1_output_0", "outputIndexes": [ 3511 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3511, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.32/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 3512 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3497, 3512, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.32/self_attn/Slice_3_output_0", "outputIndexes": [ 3513 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3513 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.32/self_attn/Neg_1_output_0", "outputIndexes": [ 3514 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3511, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.32/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 3515 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3497, 22, 3515, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.32/self_attn/Slice_2_output_0", "outputIndexes": [ 3516 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3514, 3516 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.32/self_attn/Concat_4_output_0", "outputIndexes": [ 3517 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3517, 3488 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.32/self_attn/Mul_3_output_0", "outputIndexes": [ 3518 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3498, 3518 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.32/self_attn/Add_1_output_0", "outputIndexes": [ 3519 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4753 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3874069356, 2097174, 524288, 0, 0 ] } , "name": "/layers.32/self_attn/v_proj/Linear", "outputIndexes": [ 4762 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4762 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4763 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4763 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.32/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 3520 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3442, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.32/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 3521 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3450, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.32/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 3522 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3521, 3522, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.32/self_attn/Concat_2_output_0", "outputIndexes": [ 3523 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3520, 3523 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.32/self_attn/Reshape_2_output_0", "outputIndexes": [ 3524 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3490, 3519, 3524, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.32/self_attn/Reshape_7_output_0", "outputIndexes": [ 3525 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3525 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.32/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4764 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4764 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.32/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4765 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4765 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3876690818, 8388630, 2097152, 0, 0 ] } , "name": "/layers.32/self_attn/o_proj/Linear", "outputIndexes": [ 4766 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4766 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4767 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4767 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.32/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 3526 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3429, 3526 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.32/Add_output_0", "outputIndexes": [ 3527 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3527 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3887176600, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.32/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 3528 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3528 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.32/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4768 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4768 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.32/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4769 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4769 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3887209368, 25165846, 6291456, 0, 0 ] } , "name": "/layers.32/mlp/gate_proj/Linear", "outputIndexes": [ 4770 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4770 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4771 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4771 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.32/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 3529 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3529 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.32/mlp/act_fn/Mul_output_0", "outputIndexes": [ 3530 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4769 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3918666670, 25165846, 6291456, 0, 0 ] } , "name": "/layers.32/mlp/up_proj/Linear", "outputIndexes": [ 4774 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4774 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4775 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4775 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.32/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3531 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3530, 3531 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.32/mlp/Mul_output_0", "outputIndexes": [ 3532 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3532 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.32/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4776 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4776 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.32/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4777 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4777 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3950123972, 25165846, 6291456, 0, 0 ] } , "name": "/layers.32/mlp/down_proj/Linear", "outputIndexes": [ 4778 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4778 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4779 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4779 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.32/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3533 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3527, 3533 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.32/Add_1_output_0", "outputIndexes": [ 3534 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3534, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.33/Reshape_output_0", "outputIndexes": [ 3535 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3535 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3981581274, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.33/input_layernorm/Mul_1_output_0", "outputIndexes": [ 3536 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3536 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.33/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4780 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4780 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.33/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4781 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4781 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3981614042, 8388630, 2097152, 0, 0 ] } , "name": "/layers.33/self_attn/q_proj/Linear", "outputIndexes": [ 4782 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4782 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4783 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4783 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.33/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 3537 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3536 ] , "main_type": "NONE", "name": "/blocks.33/self_attn/Shape_output_0", "outputIndexes": [ 3538 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3538 ] , "main_type": "NONE", "name": "Shape13974", "outputIndexes": [ 3539 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3538 ] , "main_type": "NONE", "name": "Rank13976", "outputIndexes": [ 3540 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3540, 3540 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13978", "outputIndexes": [ 3541 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3541 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13979", "outputIndexes": [ 3542 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3541, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13981", "outputIndexes": [ 3543 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3543 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13982", "outputIndexes": [ 3544 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3539, 3542, 3544, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13985", "outputIndexes": [ 3545 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3545 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13986", "outputIndexes": [ 3546 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3546, 3546 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13988", "outputIndexes": [ 3547 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3538, 3547, 3541 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.33/self_attn/Gather_output_0", "outputIndexes": [ 3548 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3548, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.33/self_attn/Unsqueeze_output_0", "outputIndexes": [ 3549 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3541 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13996", "outputIndexes": [ 3550 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3543 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13999", "outputIndexes": [ 3551 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3539, 3550, 3551, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14002", "outputIndexes": [ 3552 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3552 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14003", "outputIndexes": [ 3553 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3553 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14004", "outputIndexes": [ 3554 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3554, 3553 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14005", "outputIndexes": [ 3555 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3538, 3555, 3541 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.33/self_attn/Gather_1_output_0", "outputIndexes": [ 3556 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3556, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.33/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 3557 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3549, 3557, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.33/self_attn/Concat_output_0", "outputIndexes": [ 3558 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3537, 3558 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.33/self_attn/Reshape_output_0", "outputIndexes": [ 3559 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3559 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3992099824, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.33/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 3561 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14023", "outputIndexes": [ 3562 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14026", "outputIndexes": [ 3563 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3562, 3563, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14029", "outputIndexes": [ 3564 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3564 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14030", "outputIndexes": [ 3565 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3565, 3565 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14032", "outputIndexes": [ 3566 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3566, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.33/self_attn/Gather_2_output_0", "outputIndexes": [ 3567 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3561, 3567 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.33/self_attn/Mul_output_0", "outputIndexes": [ 3568 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3561 ] , "main_type": "NONE", "name": "/blocks.33/self_attn/Shape_2_output_0", "outputIndexes": [ 3569 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3569 ] , "main_type": "NONE", "name": "Shape14156", "outputIndexes": [ 3570 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3569 ] , "main_type": "NONE", "name": "Rank14158", "outputIndexes": [ 3571 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3571, 3571 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14160", "outputIndexes": [ 3572 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3572 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14161", "outputIndexes": [ 3573 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3572, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14163", "outputIndexes": [ 3574 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3574 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14164", "outputIndexes": [ 3575 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3570, 3573, 3575, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14167", "outputIndexes": [ 3576 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3576 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14168", "outputIndexes": [ 3577 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3577 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14169", "outputIndexes": [ 3578 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3578, 3577 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14170", "outputIndexes": [ 3579 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3569, 3579, 3572 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.33/self_attn/Gather_4_output_0", "outputIndexes": [ 3580 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3580, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.33/self_attn/Div_output_0", "outputIndexes": [ 3581 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3581, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.33/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 3582 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3561, 3582, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.33/self_attn/Slice_1_output_0", "outputIndexes": [ 3583 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3583 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.33/self_attn/Neg_output_0", "outputIndexes": [ 3584 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3581, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.33/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 3585 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3561, 22, 3585, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.33/self_attn/Slice_output_0", "outputIndexes": [ 3586 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3584, 3586 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.33/self_attn/Concat_3_output_0", "outputIndexes": [ 3587 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14065", "outputIndexes": [ 3588 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14068", "outputIndexes": [ 3589 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3588, 3589, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14071", "outputIndexes": [ 3590 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3590 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14072", "outputIndexes": [ 3591 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3591 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14073", "outputIndexes": [ 3592 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3592, 3591 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14074", "outputIndexes": [ 3593 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3593, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.33/self_attn/Gather_3_output_0", "outputIndexes": [ 3594 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3587, 3594 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.33/self_attn/Mul_1_output_0", "outputIndexes": [ 3595 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3568, 3595 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.33/self_attn/Add_output_0", "outputIndexes": [ 3596 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4781 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3992100848, 2097174, 524288, 0, 0 ] } , "name": "/layers.33/self_attn/k_proj/Linear", "outputIndexes": [ 4786 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4786 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4787 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4787 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.33/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 3597 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3548, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.33/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 3598 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3556, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.33/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 3599 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3598, 3599, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.33/self_attn/Concat_1_output_0", "outputIndexes": [ 3600 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3597, 3600 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.33/self_attn/Reshape_1_output_0", "outputIndexes": [ 3601 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3601 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3994722310, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.33/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 3603 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3603, 3567 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.33/self_attn/Mul_2_output_0", "outputIndexes": [ 3604 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3603 ] , "main_type": "NONE", "name": "/blocks.33/self_attn/Shape_3_output_0", "outputIndexes": [ 3605 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3605 ] , "main_type": "NONE", "name": "Shape14036", "outputIndexes": [ 3606 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3605 ] , "main_type": "NONE", "name": "Rank14038", "outputIndexes": [ 3607 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3607, 3607 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14040", "outputIndexes": [ 3608 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3608 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14041", "outputIndexes": [ 3609 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3608, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14043", "outputIndexes": [ 3610 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3610 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14044", "outputIndexes": [ 3611 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3606, 3609, 3611, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14047", "outputIndexes": [ 3612 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3612 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14048", "outputIndexes": [ 3613 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3613 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14049", "outputIndexes": [ 3614 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3614, 3613 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14050", "outputIndexes": [ 3615 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3605, 3615, 3608 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.33/self_attn/Gather_5_output_0", "outputIndexes": [ 3616 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3616, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.33/self_attn/Div_1_output_0", "outputIndexes": [ 3617 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3617, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.33/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 3618 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3603, 3618, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.33/self_attn/Slice_3_output_0", "outputIndexes": [ 3619 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3619 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.33/self_attn/Neg_1_output_0", "outputIndexes": [ 3620 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3617, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.33/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 3621 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3603, 22, 3621, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.33/self_attn/Slice_2_output_0", "outputIndexes": [ 3622 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3620, 3622 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.33/self_attn/Concat_4_output_0", "outputIndexes": [ 3623 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3623, 3594 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.33/self_attn/Mul_3_output_0", "outputIndexes": [ 3624 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3604, 3624 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.33/self_attn/Add_1_output_0", "outputIndexes": [ 3625 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4781 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3994723334, 2097174, 524288, 0, 0 ] } , "name": "/layers.33/self_attn/v_proj/Linear", "outputIndexes": [ 4790 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4790 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4791 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4791 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.33/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 3626 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3548, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.33/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 3627 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3556, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.33/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 3628 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3627, 3628, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.33/self_attn/Concat_2_output_0", "outputIndexes": [ 3629 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3626, 3629 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.33/self_attn/Reshape_2_output_0", "outputIndexes": [ 3630 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3596, 3625, 3630, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.33/self_attn/Reshape_7_output_0", "outputIndexes": [ 3631 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3631 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.33/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4792 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4792 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.33/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4793 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4793 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3997344796, 8388630, 2097152, 0, 0 ] } , "name": "/layers.33/self_attn/o_proj/Linear", "outputIndexes": [ 4794 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4794 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4795 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4795 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.33/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 3632 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3535, 3632 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.33/Add_output_0", "outputIndexes": [ 3633 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3633 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 4007830578, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.33/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 3634 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3634 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.33/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4796 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4796 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.33/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4797 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4797 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4007863346, 25165846, 6291456, 0, 0 ] } , "name": "/layers.33/mlp/gate_proj/Linear", "outputIndexes": [ 4798 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4798 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4799 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4799 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.33/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 3635 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3635 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.33/mlp/act_fn/Mul_output_0", "outputIndexes": [ 3636 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4797 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4039320648, 25165846, 6291456, 0, 0 ] } , "name": "/layers.33/mlp/up_proj/Linear", "outputIndexes": [ 4802 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4802 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4803 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4803 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.33/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3637 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3636, 3637 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.33/mlp/Mul_output_0", "outputIndexes": [ 3638 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3638 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.33/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4804 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4804 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.33/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4805 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4805 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4070777950, 25165846, 6291456, 0, 0 ] } , "name": "/layers.33/mlp/down_proj/Linear", "outputIndexes": [ 4806 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4806 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4807 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4807 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.33/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3639 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3633, 3639 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.33/Add_1_output_0", "outputIndexes": [ 3640 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3640, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.34/Reshape_output_0", "outputIndexes": [ 3641 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3641 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 4102235252, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.34/input_layernorm/Mul_1_output_0", "outputIndexes": [ 3642 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3642 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.34/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4808 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4808 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.34/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4809 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4809 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4102268020, 8388630, 2097152, 0, 0 ] } , "name": "/layers.34/self_attn/q_proj/Linear", "outputIndexes": [ 4810 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4810 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4811 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4811 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.34/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 3643 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3642 ] , "main_type": "NONE", "name": "/blocks.34/self_attn/Shape_output_0", "outputIndexes": [ 3644 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3644 ] , "main_type": "NONE", "name": "Shape14395", "outputIndexes": [ 3645 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3644 ] , "main_type": "NONE", "name": "Rank14397", "outputIndexes": [ 3646 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3646, 3646 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14399", "outputIndexes": [ 3647 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3647 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14400", "outputIndexes": [ 3648 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3647, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14402", "outputIndexes": [ 3649 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3649 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14403", "outputIndexes": [ 3650 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3645, 3648, 3650, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14406", "outputIndexes": [ 3651 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3651 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14407", "outputIndexes": [ 3652 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3652, 3652 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14409", "outputIndexes": [ 3653 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3644, 3653, 3647 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.34/self_attn/Gather_output_0", "outputIndexes": [ 3654 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3654, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.34/self_attn/Unsqueeze_output_0", "outputIndexes": [ 3655 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3647 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14417", "outputIndexes": [ 3656 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3649 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14420", "outputIndexes": [ 3657 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3645, 3656, 3657, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14423", "outputIndexes": [ 3658 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3658 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14424", "outputIndexes": [ 3659 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3659 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14425", "outputIndexes": [ 3660 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3660, 3659 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14426", "outputIndexes": [ 3661 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3644, 3661, 3647 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.34/self_attn/Gather_1_output_0", "outputIndexes": [ 3662 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3662, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.34/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 3663 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3655, 3663, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.34/self_attn/Concat_output_0", "outputIndexes": [ 3664 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3643, 3664 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.34/self_attn/Reshape_output_0", "outputIndexes": [ 3665 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3665 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 4112753802, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.34/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 3667 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14444", "outputIndexes": [ 3668 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14447", "outputIndexes": [ 3669 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3668, 3669, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14450", "outputIndexes": [ 3670 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3670 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14451", "outputIndexes": [ 3671 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3671, 3671 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14453", "outputIndexes": [ 3672 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3672, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.34/self_attn/Gather_2_output_0", "outputIndexes": [ 3673 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3667, 3673 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.34/self_attn/Mul_output_0", "outputIndexes": [ 3674 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3667 ] , "main_type": "NONE", "name": "/blocks.34/self_attn/Shape_2_output_0", "outputIndexes": [ 3675 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3675 ] , "main_type": "NONE", "name": "Shape14577", "outputIndexes": [ 3676 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3675 ] , "main_type": "NONE", "name": "Rank14579", "outputIndexes": [ 3677 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3677, 3677 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14581", "outputIndexes": [ 3678 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3678 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14582", "outputIndexes": [ 3679 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3678, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14584", "outputIndexes": [ 3680 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3680 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14585", "outputIndexes": [ 3681 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3676, 3679, 3681, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14588", "outputIndexes": [ 3682 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3682 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14589", "outputIndexes": [ 3683 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3683 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14590", "outputIndexes": [ 3684 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3684, 3683 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14591", "outputIndexes": [ 3685 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3675, 3685, 3678 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.34/self_attn/Gather_4_output_0", "outputIndexes": [ 3686 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3686, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.34/self_attn/Div_output_0", "outputIndexes": [ 3687 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3687, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.34/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 3688 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3667, 3688, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.34/self_attn/Slice_1_output_0", "outputIndexes": [ 3689 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3689 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.34/self_attn/Neg_output_0", "outputIndexes": [ 3690 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3687, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.34/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 3691 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3667, 22, 3691, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.34/self_attn/Slice_output_0", "outputIndexes": [ 3692 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3690, 3692 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.34/self_attn/Concat_3_output_0", "outputIndexes": [ 3693 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14486", "outputIndexes": [ 3694 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14489", "outputIndexes": [ 3695 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3694, 3695, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14492", "outputIndexes": [ 3696 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3696 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14493", "outputIndexes": [ 3697 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3697 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14494", "outputIndexes": [ 3698 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3698, 3697 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14495", "outputIndexes": [ 3699 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3699, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.34/self_attn/Gather_3_output_0", "outputIndexes": [ 3700 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3693, 3700 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.34/self_attn/Mul_1_output_0", "outputIndexes": [ 3701 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3674, 3701 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.34/self_attn/Add_output_0", "outputIndexes": [ 3702 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4809 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4112754826, 2097174, 524288, 0, 0 ] } , "name": "/layers.34/self_attn/k_proj/Linear", "outputIndexes": [ 4814 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4814 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4815 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4815 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.34/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 3703 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3654, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.34/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 3704 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3662, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.34/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 3705 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3704, 3705, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.34/self_attn/Concat_1_output_0", "outputIndexes": [ 3706 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3703, 3706 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.34/self_attn/Reshape_1_output_0", "outputIndexes": [ 3707 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3707 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 4115376288, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.34/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 3709 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3709, 3673 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.34/self_attn/Mul_2_output_0", "outputIndexes": [ 3710 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3709 ] , "main_type": "NONE", "name": "/blocks.34/self_attn/Shape_3_output_0", "outputIndexes": [ 3711 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3711 ] , "main_type": "NONE", "name": "Shape14457", "outputIndexes": [ 3712 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3711 ] , "main_type": "NONE", "name": "Rank14459", "outputIndexes": [ 3713 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3713, 3713 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14461", "outputIndexes": [ 3714 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3714 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14462", "outputIndexes": [ 3715 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3714, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14464", "outputIndexes": [ 3716 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3716 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14465", "outputIndexes": [ 3717 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3712, 3715, 3717, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14468", "outputIndexes": [ 3718 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3718 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14469", "outputIndexes": [ 3719 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3719 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14470", "outputIndexes": [ 3720 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3720, 3719 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14471", "outputIndexes": [ 3721 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3711, 3721, 3714 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.34/self_attn/Gather_5_output_0", "outputIndexes": [ 3722 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3722, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.34/self_attn/Div_1_output_0", "outputIndexes": [ 3723 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3723, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.34/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 3724 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3709, 3724, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.34/self_attn/Slice_3_output_0", "outputIndexes": [ 3725 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3725 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.34/self_attn/Neg_1_output_0", "outputIndexes": [ 3726 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3723, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.34/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 3727 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3709, 22, 3727, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.34/self_attn/Slice_2_output_0", "outputIndexes": [ 3728 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3726, 3728 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.34/self_attn/Concat_4_output_0", "outputIndexes": [ 3729 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3729, 3700 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.34/self_attn/Mul_3_output_0", "outputIndexes": [ 3730 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3710, 3730 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.34/self_attn/Add_1_output_0", "outputIndexes": [ 3731 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4809 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4115377312, 2097174, 524288, 0, 0 ] } , "name": "/layers.34/self_attn/v_proj/Linear", "outputIndexes": [ 4818 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4818 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4819 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4819 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.34/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 3732 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3654, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.34/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 3733 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3662, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.34/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 3734 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3733, 3734, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.34/self_attn/Concat_2_output_0", "outputIndexes": [ 3735 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3732, 3735 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.34/self_attn/Reshape_2_output_0", "outputIndexes": [ 3736 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3702, 3731, 3736, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.34/self_attn/Reshape_7_output_0", "outputIndexes": [ 3737 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3737 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.34/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4820 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4820 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.34/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4821 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4821 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4117998774, 8388630, 2097152, 0, 0 ] } , "name": "/layers.34/self_attn/o_proj/Linear", "outputIndexes": [ 4822 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4822 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4823 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4823 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.34/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 3738 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3641, 3738 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.34/Add_output_0", "outputIndexes": [ 3739 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3739 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 4128484556, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.34/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 3740 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3740 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.34/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4824 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4824 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.34/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4825 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4825 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4128517324, 25165846, 6291456, 0, 0 ] } , "name": "/layers.34/mlp/gate_proj/Linear", "outputIndexes": [ 4826 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4826 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4827 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4827 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.34/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 3741 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3741 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.34/mlp/act_fn/Mul_output_0", "outputIndexes": [ 3742 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4825 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4159974626, 25165846, 6291456, 0, 0 ] } , "name": "/layers.34/mlp/up_proj/Linear", "outputIndexes": [ 4830 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4830 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4831 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4831 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.34/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3743 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3742, 3743 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.34/mlp/Mul_output_0", "outputIndexes": [ 3744 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3744 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.34/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4832 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4832 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.34/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4833 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4833 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4191431928, 25165846, 6291456, 0, 0 ] } , "name": "/layers.34/mlp/down_proj/Linear", "outputIndexes": [ 4834 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4834 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4835 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4835 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.34/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3745 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3739, 3745 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.34/Add_1_output_0", "outputIndexes": [ 3746 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3746, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.35/Reshape_output_0", "outputIndexes": [ 3747 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3747 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 4222889230, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.35/input_layernorm/Mul_1_output_0", "outputIndexes": [ 3748 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3748 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.35/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4836 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4836 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.35/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4837 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4837 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4222921998, 8388630, 2097152, 0, 0 ] } , "name": "/layers.35/self_attn/q_proj/Linear", "outputIndexes": [ 4838 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4838 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4839 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4839 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.35/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 3749 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3748 ] , "main_type": "NONE", "name": "/blocks.35/self_attn/Shape_output_0", "outputIndexes": [ 3750 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3750 ] , "main_type": "NONE", "name": "Shape14816", "outputIndexes": [ 3751 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3750 ] , "main_type": "NONE", "name": "Rank14818", "outputIndexes": [ 3752 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3752, 3752 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14820", "outputIndexes": [ 3753 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3753 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14821", "outputIndexes": [ 3754 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3753, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14823", "outputIndexes": [ 3755 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3755 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14824", "outputIndexes": [ 3756 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3751, 3754, 3756, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14827", "outputIndexes": [ 3757 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3757 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14828", "outputIndexes": [ 3758 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3758, 3758 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14830", "outputIndexes": [ 3759 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3750, 3759, 3753 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.35/self_attn/Gather_output_0", "outputIndexes": [ 3760 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3760, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.35/self_attn/Unsqueeze_output_0", "outputIndexes": [ 3761 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3753 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14838", "outputIndexes": [ 3762 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3755 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14841", "outputIndexes": [ 3763 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3751, 3762, 3763, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14844", "outputIndexes": [ 3764 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3764 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14845", "outputIndexes": [ 3765 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3765 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14846", "outputIndexes": [ 3766 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3766, 3765 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14847", "outputIndexes": [ 3767 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3750, 3767, 3753 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.35/self_attn/Gather_1_output_0", "outputIndexes": [ 3768 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3768, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.35/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 3769 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3761, 3769, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.35/self_attn/Concat_output_0", "outputIndexes": [ 3770 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3749, 3770 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.35/self_attn/Reshape_output_0", "outputIndexes": [ 3771 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3771 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 4233407780, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.35/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 3773 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14865", "outputIndexes": [ 3774 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14868", "outputIndexes": [ 3775 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3774, 3775, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14871", "outputIndexes": [ 3776 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3776 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14872", "outputIndexes": [ 3777 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3777, 3777 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14874", "outputIndexes": [ 3778 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3778, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.35/self_attn/Gather_2_output_0", "outputIndexes": [ 3779 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3773, 3779 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.35/self_attn/Mul_output_0", "outputIndexes": [ 3780 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3773 ] , "main_type": "NONE", "name": "/blocks.35/self_attn/Shape_2_output_0", "outputIndexes": [ 3781 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3781 ] , "main_type": "NONE", "name": "Shape14966", "outputIndexes": [ 3782 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3781 ] , "main_type": "NONE", "name": "Rank14968", "outputIndexes": [ 3783 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3783, 3783 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14970", "outputIndexes": [ 3784 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3784 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14971", "outputIndexes": [ 3785 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3784, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14973", "outputIndexes": [ 3786 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3786 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14974", "outputIndexes": [ 3787 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3782, 3785, 3787, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14977", "outputIndexes": [ 3788 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3788 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14978", "outputIndexes": [ 3789 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3789 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14979", "outputIndexes": [ 3790 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3790, 3789 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14980", "outputIndexes": [ 3791 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3781, 3791, 3784 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.35/self_attn/Gather_4_output_0", "outputIndexes": [ 3792 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3792, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.35/self_attn/Div_output_0", "outputIndexes": [ 3793 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3793, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.35/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 3794 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3773, 3794, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.35/self_attn/Slice_1_output_0", "outputIndexes": [ 3795 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3795 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.35/self_attn/Neg_output_0", "outputIndexes": [ 3796 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3793, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.35/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 3797 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3773, 22, 3797, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.35/self_attn/Slice_output_0", "outputIndexes": [ 3798 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3796, 3798 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.35/self_attn/Concat_3_output_0", "outputIndexes": [ 3799 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14907", "outputIndexes": [ 3800 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14910", "outputIndexes": [ 3801 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54, 3800, 3801, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14913", "outputIndexes": [ 3802 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3802 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14914", "outputIndexes": [ 3803 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3803 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14915", "outputIndexes": [ 3804 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3804, 3803 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14916", "outputIndexes": [ 3805 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53, 3805, 56 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.35/self_attn/Gather_3_output_0", "outputIndexes": [ 3806 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3799, 3806 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.35/self_attn/Mul_1_output_0", "outputIndexes": [ 3807 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3780, 3807 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.35/self_attn/Add_output_0", "outputIndexes": [ 3808 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4837 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4233408804, 2097174, 524288, 0, 0 ] } , "name": "/layers.35/self_attn/k_proj/Linear", "outputIndexes": [ 4842 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4842 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4843 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4843 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.35/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 3809 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3760, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.35/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 3810 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3768, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.35/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 3811 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3810, 3811, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.35/self_attn/Concat_1_output_0", "outputIndexes": [ 3812 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3809, 3812 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.35/self_attn/Reshape_1_output_0", "outputIndexes": [ 3813 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3813 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 4236030266, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.35/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 3815 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3815, 3779 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.35/self_attn/Mul_2_output_0", "outputIndexes": [ 3816 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3815 ] , "main_type": "NONE", "name": "/blocks.35/self_attn/Shape_3_output_0", "outputIndexes": [ 3817 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3817 ] , "main_type": "NONE", "name": "Shape14878", "outputIndexes": [ 3818 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3817 ] , "main_type": "NONE", "name": "Rank14880", "outputIndexes": [ 3819 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3819, 3819 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14882", "outputIndexes": [ 3820 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3820 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14883", "outputIndexes": [ 3821 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3820, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14885", "outputIndexes": [ 3822 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3822 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze14886", "outputIndexes": [ 3823 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3818, 3821, 3823, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice14889", "outputIndexes": [ 3824 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3824 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze14890", "outputIndexes": [ 3825 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66, 3825 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14891", "outputIndexes": [ 3826 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3826, 3825 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp14892", "outputIndexes": [ 3827 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3817, 3827, 3820 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.35/self_attn/Gather_5_output_0", "outputIndexes": [ 3828 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3828, 78 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.35/self_attn/Div_1_output_0", "outputIndexes": [ 3829 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3829, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.35/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 3830 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3815, 3830, 81, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.35/self_attn/Slice_3_output_0", "outputIndexes": [ 3831 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3831 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.35/self_attn/Neg_1_output_0", "outputIndexes": [ 3832 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3829, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.35/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 3833 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3815, 22, 3833, 82, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.35/self_attn/Slice_2_output_0", "outputIndexes": [ 3834 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3832, 3834 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.35/self_attn/Concat_4_output_0", "outputIndexes": [ 3835 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3835, 3806 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.35/self_attn/Mul_3_output_0", "outputIndexes": [ 3836 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3816, 3836 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.35/self_attn/Add_1_output_0", "outputIndexes": [ 3837 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4837 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 65536, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4236031290, 2097174, 524288, 0, 0 ] } , "name": "/layers.35/self_attn/v_proj/Linear", "outputIndexes": [ 4846 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4846 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4847 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4847 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.35/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 3838 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3760, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.35/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 3839 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3768, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.35/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 3840 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3839, 3840, 100, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.35/self_attn/Concat_2_output_0", "outputIndexes": [ 3841 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3838, 3841 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.35/self_attn/Reshape_2_output_0", "outputIndexes": [ 3842 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3808, 3837, 3842, 132 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/blocks.35/self_attn/Reshape_7_output_0", "outputIndexes": [ 3843 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3843 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.35/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4848 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4848 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.35/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4849 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4849 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 262144, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4238652752, 8388630, 2097152, 0, 0 ] } , "name": "/layers.35/self_attn/o_proj/Linear", "outputIndexes": [ 4850 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4850 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4851 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4851 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.35/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 3844 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3747, 3844 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.35/Add_output_0", "outputIndexes": [ 3845 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3845 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 4249138534, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.35/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 3846 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3846 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.35/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4852 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4852 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.35/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4853 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4853 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4249171302, 25165846, 6291456, 0, 0 ] } , "name": "/layers.35/mlp/gate_proj/Linear", "outputIndexes": [ 4854 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4854 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4855 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4855 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.35/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 3847 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3847 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.35/mlp/act_fn/Mul_output_0", "outputIndexes": [ 3848 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4853 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 12288, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4280628604, 25165846, 6291456, 0, 0 ] } , "name": "/layers.35/mlp/up_proj/Linear", "outputIndexes": [ 4858 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4858 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4859 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4859 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 12288 ] , "dimType": "NCHW" } , "name": "/layers.35/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3849 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3848, 3849 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.35/mlp/Mul_output_0", "outputIndexes": [ 3850 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3850 ] , "main_type": "Reshape", "main": { "dims": [ -1, 12288, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.35/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4860 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4860 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.35/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4861 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4861 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 12288, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 786432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4312085906, 25165846, 6291456, 0, 0 ] } , "name": "/layers.35/mlp/down_proj/Linear", "outputIndexes": [ 4862 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4862 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4863 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4863 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.35/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3851 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3845, 3851 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.35/Add_1_output_0", "outputIndexes": [ 3852 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3852, 3, 81, 17, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_output_0", "outputIndexes": [ 3853 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3853 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 4343543208, 16384, 16384 ] , "useRMSNorm": true } , "name": "hidden_states", "outputIndexes": [ 3854 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3854 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/lm/lm_head/Linear/pre_reshape", "outputIndexes": [ 4864 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4864 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/lm/lm_head/Linear/pre_convert", "outputIndexes": [ 4865 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4865 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 151936, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 9723904, "has_scaleInt": false, "shapeInt32": true, "weightSize": 0 } , "external": [ 4343575976, 311164954, 77791232, 0, 0 ] } , "name": "/lm/lm_head/Linear", "outputIndexes": [ 4866 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4866 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/lm/lm_head/Linear/post_convert", "outputIndexes": [ 4867 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4867 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 151936 ] , "dimType": "NCHW" } , "name": "/lm/lm_head/Linear/post_reshape", "outputIndexes": [ 3855 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } ] , "outputName": [ "logits", "hidden_states", "presents" ] , "preferForwardType": "CPU", "sourceType": "ONNX", "tensorName": [ "past_key_values", "presents", "position_ids", "logits_index", "input_ids", "/blocks.0/Constant_output_0", "/blocks.0/Reshape_output_0", "/blocks.0/input_layernorm/Mul_1_output_0", "/blocks.0/self_attn/q_proj/FakeLinear_output_0", "/blocks.0/self_attn/Shape_output_0", "Shape52", "Rank54", "BinaryOp56", "Unsqueeze57", "Const9", "BinaryOp59", "Unsqueeze60", "Unsqueeze62", "StridedSlice63", "Squeeze64", "BinaryOp66", "/blocks.0/self_attn/Gather_output_0", "/rotary/Constant_4_output_0", "/blocks.0/self_attn/Unsqueeze_output_0", "Unsqueeze76", "Unsqueeze79", "StridedSlice82", "Squeeze83", "BinaryOp84", "BinaryOp85", "/blocks.0/self_attn/Gather_1_output_0", "/blocks.0/self_attn/Unsqueeze_1_output_0", "/blocks.0/self_attn/Constant_3_output_0", "/blocks.0/self_attn/Constant_4_output_0", "/blocks.0/self_attn/Concat_output_0", "/blocks.0/self_attn/Reshape_output_0", "/blocks.0/self_attn/q_norm/Cast_output_0", "/blocks.0/self_attn/q_norm/Mul_1_output_0", "/rotary/Cast_output_0", "/rotary/Constant_1_output_0", "/rotary/Reshape_output_0", "/rotary/Constant_2_output_0", "/rotary/Mul_output_0", "/rotary/Cos_output_0", "/rotary/Unsqueeze_output_0", "/rotary/Sin_output_0", "/rotary/Unsqueeze_1_output_0", "/rotary/Concat_output_0", "/rotary/Concat_1_output_0", "/rotary/Constant_7_output_0", "/rotary/Unsqueeze_2_output_0", "/rotary/Unsqueeze_3_output_0", "/rotary/Constant_10_output_0", "/rotary/Mul_1_output_0", "Shape118", "Rank120", "BinaryOp122", "Unsqueeze123", "BinaryOp125", "Unsqueeze126", "StridedSlice129", "Squeeze130", "BinaryOp132", "/blocks.0/self_attn/Gather_2_output_0", "/blocks.0/self_attn/Mul_output_0", "/blocks.0/self_attn/Shape_2_output_0", "/blocks.0/self_attn/Constant_10_output_0", "Shape260", "Rank262", "BinaryOp264", "Unsqueeze265", "BinaryOp267", "Unsqueeze268", "StridedSlice271", "Squeeze272", "BinaryOp273", "BinaryOp274", "/blocks.0/self_attn/Gather_4_output_0", "/rotary/Constant_6_output_0", "/blocks.0/self_attn/Div_output_0", "/blocks.0/self_attn/Unsqueeze_7_output_0", "/blocks.0/self_attn/Constant_19_output_0", "/blocks.0/self_attn/Constant_13_output_0", "/blocks.0/self_attn/Slice_1_output_0", "/blocks.0/self_attn/Neg_output_0", "/blocks.0/self_attn/Unsqueeze_6_output_0", "/blocks.0/self_attn/Slice_output_0", "/blocks.0/self_attn/Concat_3_output_0", "Unsqueeze169", "Unsqueeze172", "StridedSlice175", "Squeeze176", "BinaryOp177", "BinaryOp178", "/blocks.0/self_attn/Gather_3_output_0", "/blocks.0/self_attn/Mul_1_output_0", "/blocks.0/self_attn/Add_output_0", "/blocks.0/self_attn/k_proj/FakeLinear_output_0", "/blocks.0/self_attn/Unsqueeze_2_output_0", "/blocks.0/self_attn/Unsqueeze_3_output_0", "/blocks.0/self_attn/Constant_6_output_0", "/blocks.0/self_attn/Concat_1_output_0", "/blocks.0/self_attn/Reshape_1_output_0", "/blocks.0/self_attn/k_norm/Cast_output_0", "/blocks.0/self_attn/k_norm/Mul_1_output_0", "/blocks.0/self_attn/Mul_2_output_0", "/blocks.0/self_attn/Shape_3_output_0", "Shape137", "Rank139", "BinaryOp141", "Unsqueeze142", "BinaryOp144", "Unsqueeze145", "StridedSlice148", "Squeeze149", "BinaryOp150", "BinaryOp151", "/blocks.0/self_attn/Gather_5_output_0", "/blocks.0/self_attn/Div_1_output_0", "/blocks.0/self_attn/Unsqueeze_9_output_0", "/blocks.0/self_attn/Slice_3_output_0", "/blocks.0/self_attn/Neg_1_output_0", "/blocks.0/self_attn/Unsqueeze_8_output_0", "/blocks.0/self_attn/Slice_2_output_0", "/blocks.0/self_attn/Concat_4_output_0", "/blocks.0/self_attn/Mul_3_output_0", "/blocks.0/self_attn/Add_1_output_0", "/blocks.0/self_attn/v_proj/FakeLinear_output_0", "/blocks.0/self_attn/Unsqueeze_4_output_0", "/blocks.0/self_attn/Unsqueeze_5_output_0", "/blocks.0/self_attn/Concat_2_output_0", "/blocks.0/self_attn/Reshape_2_output_0", "attention_mask", "/blocks.0/self_attn/Reshape_7_output_0", "/blocks.0/self_attn/o_proj/FakeLinear_output_0", "/blocks.0/Add_output_0", "/blocks.0/post_attention_layernorm/Mul_1_output_0", "/blocks.0/mlp/gate_proj/FakeLinear_output_0", "/blocks.0/mlp/act_fn/Mul_output_0", "/blocks.0/mlp/up_proj/FakeLinear_output_0", "/blocks.0/mlp/Mul_output_0", "/blocks.0/mlp/down_proj/FakeLinear_output_0", "/blocks.0/Add_1_output_0", "/blocks.1/Reshape_output_0", "/blocks.1/input_layernorm/Mul_1_output_0", "/blocks.1/self_attn/q_proj/FakeLinear_output_0", "/blocks.1/self_attn/Shape_output_0", "Shape505", "Rank507", "BinaryOp509", "Unsqueeze510", "BinaryOp512", "Unsqueeze513", "StridedSlice516", "Squeeze517", "BinaryOp519", "/blocks.1/self_attn/Gather_output_0", "/blocks.1/self_attn/Unsqueeze_output_0", "Unsqueeze527", "Unsqueeze530", "StridedSlice533", "Squeeze534", "BinaryOp535", "BinaryOp536", "/blocks.1/self_attn/Gather_1_output_0", "/blocks.1/self_attn/Unsqueeze_1_output_0", "/blocks.1/self_attn/Concat_output_0", "/blocks.1/self_attn/Reshape_output_0", "/blocks.1/self_attn/q_norm/Cast_output_0", "/blocks.1/self_attn/q_norm/Mul_1_output_0", "Unsqueeze554", "Unsqueeze557", "StridedSlice560", "Squeeze561", "BinaryOp563", "/blocks.1/self_attn/Gather_2_output_0", "/blocks.1/self_attn/Mul_output_0", "/blocks.1/self_attn/Shape_2_output_0", "Shape686", "Rank688", "BinaryOp690", "Unsqueeze691", "BinaryOp693", "Unsqueeze694", "StridedSlice697", "Squeeze698", "BinaryOp699", "BinaryOp700", "/blocks.1/self_attn/Gather_4_output_0", "/blocks.1/self_attn/Div_output_0", "/blocks.1/self_attn/Unsqueeze_7_output_0", "/blocks.1/self_attn/Slice_1_output_0", "/blocks.1/self_attn/Neg_output_0", "/blocks.1/self_attn/Unsqueeze_6_output_0", "/blocks.1/self_attn/Slice_output_0", "/blocks.1/self_attn/Concat_3_output_0", "Unsqueeze596", "Unsqueeze599", "StridedSlice602", "Squeeze603", "BinaryOp604", "BinaryOp605", "/blocks.1/self_attn/Gather_3_output_0", "/blocks.1/self_attn/Mul_1_output_0", "/blocks.1/self_attn/Add_output_0", "/blocks.1/self_attn/k_proj/FakeLinear_output_0", "/blocks.1/self_attn/Unsqueeze_2_output_0", "/blocks.1/self_attn/Unsqueeze_3_output_0", "/blocks.1/self_attn/Concat_1_output_0", "/blocks.1/self_attn/Reshape_1_output_0", "/blocks.1/self_attn/k_norm/Cast_output_0", "/blocks.1/self_attn/k_norm/Mul_1_output_0", "/blocks.1/self_attn/Mul_2_output_0", "/blocks.1/self_attn/Shape_3_output_0", "Shape567", "Rank569", "BinaryOp571", "Unsqueeze572", "BinaryOp574", "Unsqueeze575", "StridedSlice578", "Squeeze579", "BinaryOp580", "BinaryOp581", "/blocks.1/self_attn/Gather_5_output_0", "/blocks.1/self_attn/Div_1_output_0", "/blocks.1/self_attn/Unsqueeze_9_output_0", "/blocks.1/self_attn/Slice_3_output_0", "/blocks.1/self_attn/Neg_1_output_0", "/blocks.1/self_attn/Unsqueeze_8_output_0", "/blocks.1/self_attn/Slice_2_output_0", "/blocks.1/self_attn/Concat_4_output_0", "/blocks.1/self_attn/Mul_3_output_0", "/blocks.1/self_attn/Add_1_output_0", "/blocks.1/self_attn/v_proj/FakeLinear_output_0", "/blocks.1/self_attn/Unsqueeze_4_output_0", "/blocks.1/self_attn/Unsqueeze_5_output_0", "/blocks.1/self_attn/Concat_2_output_0", "/blocks.1/self_attn/Reshape_2_output_0", "/blocks.1/self_attn/Reshape_7_output_0", "/blocks.1/self_attn/o_proj/FakeLinear_output_0", "/blocks.1/Add_output_0", "/blocks.1/post_attention_layernorm/Mul_1_output_0", "/blocks.1/mlp/gate_proj/FakeLinear_output_0", "/blocks.1/mlp/act_fn/Mul_output_0", "/blocks.1/mlp/up_proj/FakeLinear_output_0", "/blocks.1/mlp/Mul_output_0", "/blocks.1/mlp/down_proj/FakeLinear_output_0", "/blocks.1/Add_1_output_0", "/blocks.2/Reshape_output_0", "/blocks.2/input_layernorm/Mul_1_output_0", "/blocks.2/self_attn/q_proj/FakeLinear_output_0", "/blocks.2/self_attn/Shape_output_0", "Shape925", "Rank927", "BinaryOp929", "Unsqueeze930", "BinaryOp932", "Unsqueeze933", "StridedSlice936", "Squeeze937", "BinaryOp939", "/blocks.2/self_attn/Gather_output_0", "/blocks.2/self_attn/Unsqueeze_output_0", "Unsqueeze947", "Unsqueeze950", "StridedSlice953", "Squeeze954", "BinaryOp955", "BinaryOp956", "/blocks.2/self_attn/Gather_1_output_0", "/blocks.2/self_attn/Unsqueeze_1_output_0", "/blocks.2/self_attn/Concat_output_0", "/blocks.2/self_attn/Reshape_output_0", "/blocks.2/self_attn/q_norm/Cast_output_0", "/blocks.2/self_attn/q_norm/Mul_1_output_0", "Unsqueeze974", "Unsqueeze977", "StridedSlice980", "Squeeze981", "BinaryOp983", "/blocks.2/self_attn/Gather_2_output_0", "/blocks.2/self_attn/Mul_output_0", "/blocks.2/self_attn/Shape_2_output_0", "Shape1106", "Rank1108", "BinaryOp1110", "Unsqueeze1111", "BinaryOp1113", "Unsqueeze1114", "StridedSlice1117", "Squeeze1118", "BinaryOp1119", "BinaryOp1120", "/blocks.2/self_attn/Gather_4_output_0", "/blocks.2/self_attn/Div_output_0", "/blocks.2/self_attn/Unsqueeze_7_output_0", "/blocks.2/self_attn/Slice_1_output_0", "/blocks.2/self_attn/Neg_output_0", "/blocks.2/self_attn/Unsqueeze_6_output_0", "/blocks.2/self_attn/Slice_output_0", "/blocks.2/self_attn/Concat_3_output_0", "Unsqueeze1016", "Unsqueeze1019", "StridedSlice1022", "Squeeze1023", "BinaryOp1024", "BinaryOp1025", "/blocks.2/self_attn/Gather_3_output_0", "/blocks.2/self_attn/Mul_1_output_0", "/blocks.2/self_attn/Add_output_0", "/blocks.2/self_attn/k_proj/FakeLinear_output_0", "/blocks.2/self_attn/Unsqueeze_2_output_0", "/blocks.2/self_attn/Unsqueeze_3_output_0", "/blocks.2/self_attn/Concat_1_output_0", "/blocks.2/self_attn/Reshape_1_output_0", "/blocks.2/self_attn/k_norm/Cast_output_0", "/blocks.2/self_attn/k_norm/Mul_1_output_0", "/blocks.2/self_attn/Mul_2_output_0", "/blocks.2/self_attn/Shape_3_output_0", "Shape987", "Rank989", "BinaryOp991", "Unsqueeze992", "BinaryOp994", "Unsqueeze995", "StridedSlice998", "Squeeze999", "BinaryOp1000", "BinaryOp1001", "/blocks.2/self_attn/Gather_5_output_0", "/blocks.2/self_attn/Div_1_output_0", "/blocks.2/self_attn/Unsqueeze_9_output_0", "/blocks.2/self_attn/Slice_3_output_0", "/blocks.2/self_attn/Neg_1_output_0", "/blocks.2/self_attn/Unsqueeze_8_output_0", "/blocks.2/self_attn/Slice_2_output_0", "/blocks.2/self_attn/Concat_4_output_0", "/blocks.2/self_attn/Mul_3_output_0", "/blocks.2/self_attn/Add_1_output_0", "/blocks.2/self_attn/v_proj/FakeLinear_output_0", "/blocks.2/self_attn/Unsqueeze_4_output_0", "/blocks.2/self_attn/Unsqueeze_5_output_0", "/blocks.2/self_attn/Concat_2_output_0", "/blocks.2/self_attn/Reshape_2_output_0", "/blocks.2/self_attn/Reshape_7_output_0", "/blocks.2/self_attn/o_proj/FakeLinear_output_0", "/blocks.2/Add_output_0", "/blocks.2/post_attention_layernorm/Mul_1_output_0", "/blocks.2/mlp/gate_proj/FakeLinear_output_0", "/blocks.2/mlp/act_fn/Mul_output_0", "/blocks.2/mlp/up_proj/FakeLinear_output_0", "/blocks.2/mlp/Mul_output_0", "/blocks.2/mlp/down_proj/FakeLinear_output_0", "/blocks.2/Add_1_output_0", "/blocks.3/Reshape_output_0", "/blocks.3/input_layernorm/Mul_1_output_0", "/blocks.3/self_attn/q_proj/FakeLinear_output_0", "/blocks.3/self_attn/Shape_output_0", "Shape1345", "Rank1347", "BinaryOp1349", "Unsqueeze1350", "BinaryOp1352", "Unsqueeze1353", "StridedSlice1356", "Squeeze1357", "BinaryOp1359", "/blocks.3/self_attn/Gather_output_0", "/blocks.3/self_attn/Unsqueeze_output_0", "Unsqueeze1367", "Unsqueeze1370", "StridedSlice1373", "Squeeze1374", "BinaryOp1375", "BinaryOp1376", "/blocks.3/self_attn/Gather_1_output_0", "/blocks.3/self_attn/Unsqueeze_1_output_0", "/blocks.3/self_attn/Concat_output_0", "/blocks.3/self_attn/Reshape_output_0", "/blocks.3/self_attn/q_norm/Cast_output_0", "/blocks.3/self_attn/q_norm/Mul_1_output_0", "Unsqueeze1394", "Unsqueeze1397", "StridedSlice1400", "Squeeze1401", "BinaryOp1403", "/blocks.3/self_attn/Gather_2_output_0", "/blocks.3/self_attn/Mul_output_0", "/blocks.3/self_attn/Shape_2_output_0", "Shape1526", "Rank1528", "BinaryOp1530", "Unsqueeze1531", "BinaryOp1533", "Unsqueeze1534", "StridedSlice1537", "Squeeze1538", "BinaryOp1539", "BinaryOp1540", "/blocks.3/self_attn/Gather_4_output_0", "/blocks.3/self_attn/Div_output_0", "/blocks.3/self_attn/Unsqueeze_7_output_0", "/blocks.3/self_attn/Slice_1_output_0", "/blocks.3/self_attn/Neg_output_0", "/blocks.3/self_attn/Unsqueeze_6_output_0", "/blocks.3/self_attn/Slice_output_0", "/blocks.3/self_attn/Concat_3_output_0", "Unsqueeze1436", "Unsqueeze1439", "StridedSlice1442", "Squeeze1443", "BinaryOp1444", "BinaryOp1445", "/blocks.3/self_attn/Gather_3_output_0", "/blocks.3/self_attn/Mul_1_output_0", "/blocks.3/self_attn/Add_output_0", "/blocks.3/self_attn/k_proj/FakeLinear_output_0", "/blocks.3/self_attn/Unsqueeze_2_output_0", "/blocks.3/self_attn/Unsqueeze_3_output_0", "/blocks.3/self_attn/Concat_1_output_0", "/blocks.3/self_attn/Reshape_1_output_0", "/blocks.3/self_attn/k_norm/Cast_output_0", "/blocks.3/self_attn/k_norm/Mul_1_output_0", "/blocks.3/self_attn/Mul_2_output_0", "/blocks.3/self_attn/Shape_3_output_0", "Shape1407", "Rank1409", "BinaryOp1411", "Unsqueeze1412", "BinaryOp1414", "Unsqueeze1415", "StridedSlice1418", "Squeeze1419", "BinaryOp1420", "BinaryOp1421", "/blocks.3/self_attn/Gather_5_output_0", "/blocks.3/self_attn/Div_1_output_0", "/blocks.3/self_attn/Unsqueeze_9_output_0", "/blocks.3/self_attn/Slice_3_output_0", "/blocks.3/self_attn/Neg_1_output_0", "/blocks.3/self_attn/Unsqueeze_8_output_0", "/blocks.3/self_attn/Slice_2_output_0", "/blocks.3/self_attn/Concat_4_output_0", "/blocks.3/self_attn/Mul_3_output_0", "/blocks.3/self_attn/Add_1_output_0", "/blocks.3/self_attn/v_proj/FakeLinear_output_0", "/blocks.3/self_attn/Unsqueeze_4_output_0", "/blocks.3/self_attn/Unsqueeze_5_output_0", "/blocks.3/self_attn/Concat_2_output_0", "/blocks.3/self_attn/Reshape_2_output_0", "/blocks.3/self_attn/Reshape_7_output_0", "/blocks.3/self_attn/o_proj/FakeLinear_output_0", "/blocks.3/Add_output_0", "/blocks.3/post_attention_layernorm/Mul_1_output_0", "/blocks.3/mlp/gate_proj/FakeLinear_output_0", "/blocks.3/mlp/act_fn/Mul_output_0", "/blocks.3/mlp/up_proj/FakeLinear_output_0", "/blocks.3/mlp/Mul_output_0", "/blocks.3/mlp/down_proj/FakeLinear_output_0", "/blocks.3/Add_1_output_0", "/blocks.4/Reshape_output_0", "/blocks.4/input_layernorm/Mul_1_output_0", "/blocks.4/self_attn/q_proj/FakeLinear_output_0", "/blocks.4/self_attn/Shape_output_0", "Shape1765", "Rank1767", "BinaryOp1769", "Unsqueeze1770", "BinaryOp1772", "Unsqueeze1773", "StridedSlice1776", "Squeeze1777", "BinaryOp1779", "/blocks.4/self_attn/Gather_output_0", "/blocks.4/self_attn/Unsqueeze_output_0", "Unsqueeze1787", "Unsqueeze1790", "StridedSlice1793", "Squeeze1794", "BinaryOp1795", "BinaryOp1796", "/blocks.4/self_attn/Gather_1_output_0", "/blocks.4/self_attn/Unsqueeze_1_output_0", "/blocks.4/self_attn/Concat_output_0", "/blocks.4/self_attn/Reshape_output_0", "/blocks.4/self_attn/q_norm/Cast_output_0", "/blocks.4/self_attn/q_norm/Mul_1_output_0", "Unsqueeze1814", "Unsqueeze1817", "StridedSlice1820", "Squeeze1821", "BinaryOp1823", "/blocks.4/self_attn/Gather_2_output_0", "/blocks.4/self_attn/Mul_output_0", "/blocks.4/self_attn/Shape_2_output_0", "Shape1947", "Rank1949", "BinaryOp1951", "Unsqueeze1952", "BinaryOp1954", "Unsqueeze1955", "StridedSlice1958", "Squeeze1959", "BinaryOp1960", "BinaryOp1961", "/blocks.4/self_attn/Gather_4_output_0", "/blocks.4/self_attn/Div_output_0", "/blocks.4/self_attn/Unsqueeze_7_output_0", "/blocks.4/self_attn/Slice_1_output_0", "/blocks.4/self_attn/Neg_output_0", "/blocks.4/self_attn/Unsqueeze_6_output_0", "/blocks.4/self_attn/Slice_output_0", "/blocks.4/self_attn/Concat_3_output_0", "Unsqueeze1856", "Unsqueeze1859", "StridedSlice1862", "Squeeze1863", "BinaryOp1864", "BinaryOp1865", "/blocks.4/self_attn/Gather_3_output_0", "/blocks.4/self_attn/Mul_1_output_0", "/blocks.4/self_attn/Add_output_0", "/blocks.4/self_attn/k_proj/FakeLinear_output_0", "/blocks.4/self_attn/Unsqueeze_2_output_0", "/blocks.4/self_attn/Unsqueeze_3_output_0", "/blocks.4/self_attn/Concat_1_output_0", "/blocks.4/self_attn/Reshape_1_output_0", "/blocks.4/self_attn/k_norm/Cast_output_0", "/blocks.4/self_attn/k_norm/Mul_1_output_0", "/blocks.4/self_attn/Mul_2_output_0", "/blocks.4/self_attn/Shape_3_output_0", "Shape1827", "Rank1829", "BinaryOp1831", "Unsqueeze1832", "BinaryOp1834", "Unsqueeze1835", "StridedSlice1838", "Squeeze1839", "BinaryOp1840", "BinaryOp1841", "/blocks.4/self_attn/Gather_5_output_0", "/blocks.4/self_attn/Div_1_output_0", "/blocks.4/self_attn/Unsqueeze_9_output_0", "/blocks.4/self_attn/Slice_3_output_0", "/blocks.4/self_attn/Neg_1_output_0", "/blocks.4/self_attn/Unsqueeze_8_output_0", "/blocks.4/self_attn/Slice_2_output_0", "/blocks.4/self_attn/Concat_4_output_0", "/blocks.4/self_attn/Mul_3_output_0", "/blocks.4/self_attn/Add_1_output_0", "/blocks.4/self_attn/v_proj/FakeLinear_output_0", "/blocks.4/self_attn/Unsqueeze_4_output_0", "/blocks.4/self_attn/Unsqueeze_5_output_0", "/blocks.4/self_attn/Concat_2_output_0", "/blocks.4/self_attn/Reshape_2_output_0", "/blocks.4/self_attn/Reshape_7_output_0", "/blocks.4/self_attn/o_proj/FakeLinear_output_0", "/blocks.4/Add_output_0", "/blocks.4/post_attention_layernorm/Mul_1_output_0", "/blocks.4/mlp/gate_proj/FakeLinear_output_0", "/blocks.4/mlp/act_fn/Mul_output_0", "/blocks.4/mlp/up_proj/FakeLinear_output_0", "/blocks.4/mlp/Mul_output_0", "/blocks.4/mlp/down_proj/FakeLinear_output_0", "/blocks.4/Add_1_output_0", "/blocks.5/Reshape_output_0", "/blocks.5/input_layernorm/Mul_1_output_0", "/blocks.5/self_attn/q_proj/FakeLinear_output_0", "/blocks.5/self_attn/Shape_output_0", "Shape2186", "Rank2188", "BinaryOp2190", "Unsqueeze2191", "BinaryOp2193", "Unsqueeze2194", "StridedSlice2197", "Squeeze2198", "BinaryOp2200", "/blocks.5/self_attn/Gather_output_0", "/blocks.5/self_attn/Unsqueeze_output_0", "Unsqueeze2208", "Unsqueeze2211", "StridedSlice2214", "Squeeze2215", "BinaryOp2216", "BinaryOp2217", "/blocks.5/self_attn/Gather_1_output_0", "/blocks.5/self_attn/Unsqueeze_1_output_0", "/blocks.5/self_attn/Concat_output_0", "/blocks.5/self_attn/Reshape_output_0", "/blocks.5/self_attn/q_norm/Cast_output_0", "/blocks.5/self_attn/q_norm/Mul_1_output_0", "Unsqueeze2235", "Unsqueeze2238", "StridedSlice2241", "Squeeze2242", "BinaryOp2244", "/blocks.5/self_attn/Gather_2_output_0", "/blocks.5/self_attn/Mul_output_0", "/blocks.5/self_attn/Shape_2_output_0", "Shape2368", "Rank2370", "BinaryOp2372", "Unsqueeze2373", "BinaryOp2375", "Unsqueeze2376", "StridedSlice2379", "Squeeze2380", "BinaryOp2381", "BinaryOp2382", "/blocks.5/self_attn/Gather_4_output_0", "/blocks.5/self_attn/Div_output_0", "/blocks.5/self_attn/Unsqueeze_7_output_0", "/blocks.5/self_attn/Slice_1_output_0", "/blocks.5/self_attn/Neg_output_0", "/blocks.5/self_attn/Unsqueeze_6_output_0", "/blocks.5/self_attn/Slice_output_0", "/blocks.5/self_attn/Concat_3_output_0", "Unsqueeze2277", "Unsqueeze2280", "StridedSlice2283", "Squeeze2284", "BinaryOp2285", "BinaryOp2286", "/blocks.5/self_attn/Gather_3_output_0", "/blocks.5/self_attn/Mul_1_output_0", "/blocks.5/self_attn/Add_output_0", "/blocks.5/self_attn/k_proj/FakeLinear_output_0", "/blocks.5/self_attn/Unsqueeze_2_output_0", "/blocks.5/self_attn/Unsqueeze_3_output_0", "/blocks.5/self_attn/Concat_1_output_0", "/blocks.5/self_attn/Reshape_1_output_0", "/blocks.5/self_attn/k_norm/Cast_output_0", "/blocks.5/self_attn/k_norm/Mul_1_output_0", "/blocks.5/self_attn/Mul_2_output_0", "/blocks.5/self_attn/Shape_3_output_0", "Shape2248", "Rank2250", "BinaryOp2252", "Unsqueeze2253", "BinaryOp2255", "Unsqueeze2256", "StridedSlice2259", "Squeeze2260", "BinaryOp2261", "BinaryOp2262", "/blocks.5/self_attn/Gather_5_output_0", "/blocks.5/self_attn/Div_1_output_0", "/blocks.5/self_attn/Unsqueeze_9_output_0", "/blocks.5/self_attn/Slice_3_output_0", "/blocks.5/self_attn/Neg_1_output_0", "/blocks.5/self_attn/Unsqueeze_8_output_0", "/blocks.5/self_attn/Slice_2_output_0", "/blocks.5/self_attn/Concat_4_output_0", "/blocks.5/self_attn/Mul_3_output_0", "/blocks.5/self_attn/Add_1_output_0", "/blocks.5/self_attn/v_proj/FakeLinear_output_0", "/blocks.5/self_attn/Unsqueeze_4_output_0", "/blocks.5/self_attn/Unsqueeze_5_output_0", "/blocks.5/self_attn/Concat_2_output_0", "/blocks.5/self_attn/Reshape_2_output_0", "/blocks.5/self_attn/Reshape_7_output_0", "/blocks.5/self_attn/o_proj/FakeLinear_output_0", "/blocks.5/Add_output_0", "/blocks.5/post_attention_layernorm/Mul_1_output_0", "/blocks.5/mlp/gate_proj/FakeLinear_output_0", "/blocks.5/mlp/act_fn/Mul_output_0", "/blocks.5/mlp/up_proj/FakeLinear_output_0", "/blocks.5/mlp/Mul_output_0", "/blocks.5/mlp/down_proj/FakeLinear_output_0", "/blocks.5/Add_1_output_0", "/blocks.6/Reshape_output_0", "/blocks.6/input_layernorm/Mul_1_output_0", "/blocks.6/self_attn/q_proj/FakeLinear_output_0", "/blocks.6/self_attn/Shape_output_0", "Shape2607", "Rank2609", "BinaryOp2611", "Unsqueeze2612", "BinaryOp2614", "Unsqueeze2615", "StridedSlice2618", "Squeeze2619", "BinaryOp2621", "/blocks.6/self_attn/Gather_output_0", "/blocks.6/self_attn/Unsqueeze_output_0", "Unsqueeze2629", "Unsqueeze2632", "StridedSlice2635", "Squeeze2636", "BinaryOp2637", "BinaryOp2638", "/blocks.6/self_attn/Gather_1_output_0", "/blocks.6/self_attn/Unsqueeze_1_output_0", "/blocks.6/self_attn/Concat_output_0", "/blocks.6/self_attn/Reshape_output_0", "/blocks.6/self_attn/q_norm/Cast_output_0", "/blocks.6/self_attn/q_norm/Mul_1_output_0", "Unsqueeze2656", "Unsqueeze2659", "StridedSlice2662", "Squeeze2663", "BinaryOp2665", "/blocks.6/self_attn/Gather_2_output_0", "/blocks.6/self_attn/Mul_output_0", "/blocks.6/self_attn/Shape_2_output_0", "Shape2789", "Rank2791", "BinaryOp2793", "Unsqueeze2794", "BinaryOp2796", "Unsqueeze2797", "StridedSlice2800", "Squeeze2801", "BinaryOp2802", "BinaryOp2803", "/blocks.6/self_attn/Gather_4_output_0", "/blocks.6/self_attn/Div_output_0", "/blocks.6/self_attn/Unsqueeze_7_output_0", "/blocks.6/self_attn/Slice_1_output_0", "/blocks.6/self_attn/Neg_output_0", "/blocks.6/self_attn/Unsqueeze_6_output_0", "/blocks.6/self_attn/Slice_output_0", "/blocks.6/self_attn/Concat_3_output_0", "Unsqueeze2698", "Unsqueeze2701", "StridedSlice2704", "Squeeze2705", "BinaryOp2706", "BinaryOp2707", "/blocks.6/self_attn/Gather_3_output_0", "/blocks.6/self_attn/Mul_1_output_0", "/blocks.6/self_attn/Add_output_0", "/blocks.6/self_attn/k_proj/FakeLinear_output_0", "/blocks.6/self_attn/Unsqueeze_2_output_0", "/blocks.6/self_attn/Unsqueeze_3_output_0", "/blocks.6/self_attn/Concat_1_output_0", "/blocks.6/self_attn/Reshape_1_output_0", "/blocks.6/self_attn/k_norm/Cast_output_0", "/blocks.6/self_attn/k_norm/Mul_1_output_0", "/blocks.6/self_attn/Mul_2_output_0", "/blocks.6/self_attn/Shape_3_output_0", "Shape2669", "Rank2671", "BinaryOp2673", "Unsqueeze2674", "BinaryOp2676", "Unsqueeze2677", "StridedSlice2680", "Squeeze2681", "BinaryOp2682", "BinaryOp2683", "/blocks.6/self_attn/Gather_5_output_0", "/blocks.6/self_attn/Div_1_output_0", "/blocks.6/self_attn/Unsqueeze_9_output_0", "/blocks.6/self_attn/Slice_3_output_0", "/blocks.6/self_attn/Neg_1_output_0", "/blocks.6/self_attn/Unsqueeze_8_output_0", "/blocks.6/self_attn/Slice_2_output_0", "/blocks.6/self_attn/Concat_4_output_0", "/blocks.6/self_attn/Mul_3_output_0", "/blocks.6/self_attn/Add_1_output_0", "/blocks.6/self_attn/v_proj/FakeLinear_output_0", "/blocks.6/self_attn/Unsqueeze_4_output_0", "/blocks.6/self_attn/Unsqueeze_5_output_0", "/blocks.6/self_attn/Concat_2_output_0", "/blocks.6/self_attn/Reshape_2_output_0", "/blocks.6/self_attn/Reshape_7_output_0", "/blocks.6/self_attn/o_proj/FakeLinear_output_0", "/blocks.6/Add_output_0", "/blocks.6/post_attention_layernorm/Mul_1_output_0", "/blocks.6/mlp/gate_proj/FakeLinear_output_0", "/blocks.6/mlp/act_fn/Mul_output_0", "/blocks.6/mlp/up_proj/FakeLinear_output_0", "/blocks.6/mlp/Mul_output_0", "/blocks.6/mlp/down_proj/FakeLinear_output_0", "/blocks.6/Add_1_output_0", "/blocks.7/Reshape_output_0", "/blocks.7/input_layernorm/Mul_1_output_0", "/blocks.7/self_attn/q_proj/FakeLinear_output_0", "/blocks.7/self_attn/Shape_output_0", "Shape3028", "Rank3030", "BinaryOp3032", "Unsqueeze3033", "BinaryOp3035", "Unsqueeze3036", "StridedSlice3039", "Squeeze3040", "BinaryOp3042", "/blocks.7/self_attn/Gather_output_0", "/blocks.7/self_attn/Unsqueeze_output_0", "Unsqueeze3050", "Unsqueeze3053", "StridedSlice3056", "Squeeze3057", "BinaryOp3058", "BinaryOp3059", "/blocks.7/self_attn/Gather_1_output_0", "/blocks.7/self_attn/Unsqueeze_1_output_0", "/blocks.7/self_attn/Concat_output_0", "/blocks.7/self_attn/Reshape_output_0", "/blocks.7/self_attn/q_norm/Cast_output_0", "/blocks.7/self_attn/q_norm/Mul_1_output_0", "Unsqueeze3077", "Unsqueeze3080", "StridedSlice3083", "Squeeze3084", "BinaryOp3086", "/blocks.7/self_attn/Gather_2_output_0", "/blocks.7/self_attn/Mul_output_0", "/blocks.7/self_attn/Shape_2_output_0", "Shape3210", "Rank3212", "BinaryOp3214", "Unsqueeze3215", "BinaryOp3217", "Unsqueeze3218", "StridedSlice3221", "Squeeze3222", "BinaryOp3223", "BinaryOp3224", "/blocks.7/self_attn/Gather_4_output_0", "/blocks.7/self_attn/Div_output_0", "/blocks.7/self_attn/Unsqueeze_7_output_0", "/blocks.7/self_attn/Slice_1_output_0", "/blocks.7/self_attn/Neg_output_0", "/blocks.7/self_attn/Unsqueeze_6_output_0", "/blocks.7/self_attn/Slice_output_0", "/blocks.7/self_attn/Concat_3_output_0", "Unsqueeze3119", "Unsqueeze3122", "StridedSlice3125", "Squeeze3126", "BinaryOp3127", "BinaryOp3128", "/blocks.7/self_attn/Gather_3_output_0", "/blocks.7/self_attn/Mul_1_output_0", "/blocks.7/self_attn/Add_output_0", "/blocks.7/self_attn/k_proj/FakeLinear_output_0", "/blocks.7/self_attn/Unsqueeze_2_output_0", "/blocks.7/self_attn/Unsqueeze_3_output_0", "/blocks.7/self_attn/Concat_1_output_0", "/blocks.7/self_attn/Reshape_1_output_0", "/blocks.7/self_attn/k_norm/Cast_output_0", "/blocks.7/self_attn/k_norm/Mul_1_output_0", "/blocks.7/self_attn/Mul_2_output_0", "/blocks.7/self_attn/Shape_3_output_0", "Shape3090", "Rank3092", "BinaryOp3094", "Unsqueeze3095", "BinaryOp3097", "Unsqueeze3098", "StridedSlice3101", "Squeeze3102", "BinaryOp3103", "BinaryOp3104", "/blocks.7/self_attn/Gather_5_output_0", "/blocks.7/self_attn/Div_1_output_0", "/blocks.7/self_attn/Unsqueeze_9_output_0", "/blocks.7/self_attn/Slice_3_output_0", "/blocks.7/self_attn/Neg_1_output_0", "/blocks.7/self_attn/Unsqueeze_8_output_0", "/blocks.7/self_attn/Slice_2_output_0", "/blocks.7/self_attn/Concat_4_output_0", "/blocks.7/self_attn/Mul_3_output_0", "/blocks.7/self_attn/Add_1_output_0", "/blocks.7/self_attn/v_proj/FakeLinear_output_0", "/blocks.7/self_attn/Unsqueeze_4_output_0", "/blocks.7/self_attn/Unsqueeze_5_output_0", "/blocks.7/self_attn/Concat_2_output_0", "/blocks.7/self_attn/Reshape_2_output_0", "/blocks.7/self_attn/Reshape_7_output_0", "/blocks.7/self_attn/o_proj/FakeLinear_output_0", "/blocks.7/Add_output_0", "/blocks.7/post_attention_layernorm/Mul_1_output_0", "/blocks.7/mlp/gate_proj/FakeLinear_output_0", "/blocks.7/mlp/act_fn/Mul_output_0", "/blocks.7/mlp/up_proj/FakeLinear_output_0", "/blocks.7/mlp/Mul_output_0", "/blocks.7/mlp/down_proj/FakeLinear_output_0", "/blocks.7/Add_1_output_0", "/blocks.8/Reshape_output_0", "/blocks.8/input_layernorm/Mul_1_output_0", "/blocks.8/self_attn/q_proj/FakeLinear_output_0", "/blocks.8/self_attn/Shape_output_0", "Shape3449", "Rank3451", "BinaryOp3453", "Unsqueeze3454", "BinaryOp3456", "Unsqueeze3457", "StridedSlice3460", "Squeeze3461", "BinaryOp3463", "/blocks.8/self_attn/Gather_output_0", "/blocks.8/self_attn/Unsqueeze_output_0", "Unsqueeze3471", "Unsqueeze3474", "StridedSlice3477", "Squeeze3478", "BinaryOp3479", "BinaryOp3480", "/blocks.8/self_attn/Gather_1_output_0", "/blocks.8/self_attn/Unsqueeze_1_output_0", "/blocks.8/self_attn/Concat_output_0", "/blocks.8/self_attn/Reshape_output_0", "/blocks.8/self_attn/q_norm/Cast_output_0", "/blocks.8/self_attn/q_norm/Mul_1_output_0", "Unsqueeze3498", "Unsqueeze3501", "StridedSlice3504", "Squeeze3505", "BinaryOp3507", "/blocks.8/self_attn/Gather_2_output_0", "/blocks.8/self_attn/Mul_output_0", "/blocks.8/self_attn/Shape_2_output_0", "Shape3631", "Rank3633", "BinaryOp3635", "Unsqueeze3636", "BinaryOp3638", "Unsqueeze3639", "StridedSlice3642", "Squeeze3643", "BinaryOp3644", "BinaryOp3645", "/blocks.8/self_attn/Gather_4_output_0", "/blocks.8/self_attn/Div_output_0", "/blocks.8/self_attn/Unsqueeze_7_output_0", "/blocks.8/self_attn/Slice_1_output_0", "/blocks.8/self_attn/Neg_output_0", "/blocks.8/self_attn/Unsqueeze_6_output_0", "/blocks.8/self_attn/Slice_output_0", "/blocks.8/self_attn/Concat_3_output_0", "Unsqueeze3540", "Unsqueeze3543", "StridedSlice3546", "Squeeze3547", "BinaryOp3548", "BinaryOp3549", "/blocks.8/self_attn/Gather_3_output_0", "/blocks.8/self_attn/Mul_1_output_0", "/blocks.8/self_attn/Add_output_0", "/blocks.8/self_attn/k_proj/FakeLinear_output_0", "/blocks.8/self_attn/Unsqueeze_2_output_0", "/blocks.8/self_attn/Unsqueeze_3_output_0", "/blocks.8/self_attn/Concat_1_output_0", "/blocks.8/self_attn/Reshape_1_output_0", "/blocks.8/self_attn/k_norm/Cast_output_0", "/blocks.8/self_attn/k_norm/Mul_1_output_0", "/blocks.8/self_attn/Mul_2_output_0", "/blocks.8/self_attn/Shape_3_output_0", "Shape3511", "Rank3513", "BinaryOp3515", "Unsqueeze3516", "BinaryOp3518", "Unsqueeze3519", "StridedSlice3522", "Squeeze3523", "BinaryOp3524", "BinaryOp3525", "/blocks.8/self_attn/Gather_5_output_0", "/blocks.8/self_attn/Div_1_output_0", "/blocks.8/self_attn/Unsqueeze_9_output_0", "/blocks.8/self_attn/Slice_3_output_0", "/blocks.8/self_attn/Neg_1_output_0", "/blocks.8/self_attn/Unsqueeze_8_output_0", "/blocks.8/self_attn/Slice_2_output_0", "/blocks.8/self_attn/Concat_4_output_0", "/blocks.8/self_attn/Mul_3_output_0", "/blocks.8/self_attn/Add_1_output_0", "/blocks.8/self_attn/v_proj/FakeLinear_output_0", "/blocks.8/self_attn/Unsqueeze_4_output_0", "/blocks.8/self_attn/Unsqueeze_5_output_0", "/blocks.8/self_attn/Concat_2_output_0", "/blocks.8/self_attn/Reshape_2_output_0", "/blocks.8/self_attn/Reshape_7_output_0", "/blocks.8/self_attn/o_proj/FakeLinear_output_0", "/blocks.8/Add_output_0", "/blocks.8/post_attention_layernorm/Mul_1_output_0", "/blocks.8/mlp/gate_proj/FakeLinear_output_0", "/blocks.8/mlp/act_fn/Mul_output_0", "/blocks.8/mlp/up_proj/FakeLinear_output_0", "/blocks.8/mlp/Mul_output_0", "/blocks.8/mlp/down_proj/FakeLinear_output_0", "/blocks.8/Add_1_output_0", "/blocks.9/Reshape_output_0", "/blocks.9/input_layernorm/Mul_1_output_0", "/blocks.9/self_attn/q_proj/FakeLinear_output_0", "/blocks.9/self_attn/Shape_output_0", "Shape3870", "Rank3872", "BinaryOp3874", "Unsqueeze3875", "BinaryOp3877", "Unsqueeze3878", "StridedSlice3881", "Squeeze3882", "BinaryOp3884", "/blocks.9/self_attn/Gather_output_0", "/blocks.9/self_attn/Unsqueeze_output_0", "Unsqueeze3892", "Unsqueeze3895", "StridedSlice3898", "Squeeze3899", "BinaryOp3900", "BinaryOp3901", "/blocks.9/self_attn/Gather_1_output_0", "/blocks.9/self_attn/Unsqueeze_1_output_0", "/blocks.9/self_attn/Concat_output_0", "/blocks.9/self_attn/Reshape_output_0", "/blocks.9/self_attn/q_norm/Cast_output_0", "/blocks.9/self_attn/q_norm/Mul_1_output_0", "Unsqueeze3919", "Unsqueeze3922", "StridedSlice3925", "Squeeze3926", "BinaryOp3928", "/blocks.9/self_attn/Gather_2_output_0", "/blocks.9/self_attn/Mul_output_0", "/blocks.9/self_attn/Shape_2_output_0", "Shape4052", "Rank4054", "BinaryOp4056", "Unsqueeze4057", "BinaryOp4059", "Unsqueeze4060", "StridedSlice4063", "Squeeze4064", "BinaryOp4065", "BinaryOp4066", "/blocks.9/self_attn/Gather_4_output_0", "/blocks.9/self_attn/Div_output_0", "/blocks.9/self_attn/Unsqueeze_7_output_0", "/blocks.9/self_attn/Slice_1_output_0", "/blocks.9/self_attn/Neg_output_0", "/blocks.9/self_attn/Unsqueeze_6_output_0", "/blocks.9/self_attn/Slice_output_0", "/blocks.9/self_attn/Concat_3_output_0", "Unsqueeze3961", "Unsqueeze3964", "StridedSlice3967", "Squeeze3968", "BinaryOp3969", "BinaryOp3970", "/blocks.9/self_attn/Gather_3_output_0", "/blocks.9/self_attn/Mul_1_output_0", "/blocks.9/self_attn/Add_output_0", "/blocks.9/self_attn/k_proj/FakeLinear_output_0", "/blocks.9/self_attn/Unsqueeze_2_output_0", "/blocks.9/self_attn/Unsqueeze_3_output_0", "/blocks.9/self_attn/Concat_1_output_0", "/blocks.9/self_attn/Reshape_1_output_0", "/blocks.9/self_attn/k_norm/Cast_output_0", "/blocks.9/self_attn/k_norm/Mul_1_output_0", "/blocks.9/self_attn/Mul_2_output_0", "/blocks.9/self_attn/Shape_3_output_0", "Shape3932", "Rank3934", "BinaryOp3936", "Unsqueeze3937", "BinaryOp3939", "Unsqueeze3940", "StridedSlice3943", "Squeeze3944", "BinaryOp3945", "BinaryOp3946", "/blocks.9/self_attn/Gather_5_output_0", "/blocks.9/self_attn/Div_1_output_0", "/blocks.9/self_attn/Unsqueeze_9_output_0", "/blocks.9/self_attn/Slice_3_output_0", "/blocks.9/self_attn/Neg_1_output_0", "/blocks.9/self_attn/Unsqueeze_8_output_0", "/blocks.9/self_attn/Slice_2_output_0", "/blocks.9/self_attn/Concat_4_output_0", "/blocks.9/self_attn/Mul_3_output_0", "/blocks.9/self_attn/Add_1_output_0", "/blocks.9/self_attn/v_proj/FakeLinear_output_0", "/blocks.9/self_attn/Unsqueeze_4_output_0", "/blocks.9/self_attn/Unsqueeze_5_output_0", "/blocks.9/self_attn/Concat_2_output_0", "/blocks.9/self_attn/Reshape_2_output_0", "/blocks.9/self_attn/Reshape_7_output_0", "/blocks.9/self_attn/o_proj/FakeLinear_output_0", "/blocks.9/Add_output_0", "/blocks.9/post_attention_layernorm/Mul_1_output_0", "/blocks.9/mlp/gate_proj/FakeLinear_output_0", "/blocks.9/mlp/act_fn/Mul_output_0", "/blocks.9/mlp/up_proj/FakeLinear_output_0", "/blocks.9/mlp/Mul_output_0", "/blocks.9/mlp/down_proj/FakeLinear_output_0", "/blocks.9/Add_1_output_0", "/blocks.10/Reshape_output_0", "/blocks.10/input_layernorm/Mul_1_output_0", "/blocks.10/self_attn/q_proj/FakeLinear_output_0", "/blocks.10/self_attn/Shape_output_0", "Shape4291", "Rank4293", "BinaryOp4295", "Unsqueeze4296", "BinaryOp4298", "Unsqueeze4299", "StridedSlice4302", "Squeeze4303", "BinaryOp4305", "/blocks.10/self_attn/Gather_output_0", "/blocks.10/self_attn/Unsqueeze_output_0", "Unsqueeze4313", "Unsqueeze4316", "StridedSlice4319", "Squeeze4320", "BinaryOp4321", "BinaryOp4322", "/blocks.10/self_attn/Gather_1_output_0", "/blocks.10/self_attn/Unsqueeze_1_output_0", "/blocks.10/self_attn/Concat_output_0", "/blocks.10/self_attn/Reshape_output_0", "/blocks.10/self_attn/q_norm/Cast_output_0", "/blocks.10/self_attn/q_norm/Mul_1_output_0", "Unsqueeze4340", "Unsqueeze4343", "StridedSlice4346", "Squeeze4347", "BinaryOp4349", "/blocks.10/self_attn/Gather_2_output_0", "/blocks.10/self_attn/Mul_output_0", "/blocks.10/self_attn/Shape_2_output_0", "Shape4473", "Rank4475", "BinaryOp4477", "Unsqueeze4478", "BinaryOp4480", "Unsqueeze4481", "StridedSlice4484", "Squeeze4485", "BinaryOp4486", "BinaryOp4487", "/blocks.10/self_attn/Gather_4_output_0", "/blocks.10/self_attn/Div_output_0", "/blocks.10/self_attn/Unsqueeze_7_output_0", "/blocks.10/self_attn/Slice_1_output_0", "/blocks.10/self_attn/Neg_output_0", "/blocks.10/self_attn/Unsqueeze_6_output_0", "/blocks.10/self_attn/Slice_output_0", "/blocks.10/self_attn/Concat_3_output_0", "Unsqueeze4382", "Unsqueeze4385", "StridedSlice4388", "Squeeze4389", "BinaryOp4390", "BinaryOp4391", "/blocks.10/self_attn/Gather_3_output_0", "/blocks.10/self_attn/Mul_1_output_0", "/blocks.10/self_attn/Add_output_0", "/blocks.10/self_attn/k_proj/FakeLinear_output_0", "/blocks.10/self_attn/Unsqueeze_2_output_0", "/blocks.10/self_attn/Unsqueeze_3_output_0", "/blocks.10/self_attn/Concat_1_output_0", "/blocks.10/self_attn/Reshape_1_output_0", "/blocks.10/self_attn/k_norm/Cast_output_0", "/blocks.10/self_attn/k_norm/Mul_1_output_0", "/blocks.10/self_attn/Mul_2_output_0", "/blocks.10/self_attn/Shape_3_output_0", "Shape4353", "Rank4355", "BinaryOp4357", "Unsqueeze4358", "BinaryOp4360", "Unsqueeze4361", "StridedSlice4364", "Squeeze4365", "BinaryOp4366", "BinaryOp4367", "/blocks.10/self_attn/Gather_5_output_0", "/blocks.10/self_attn/Div_1_output_0", "/blocks.10/self_attn/Unsqueeze_9_output_0", "/blocks.10/self_attn/Slice_3_output_0", "/blocks.10/self_attn/Neg_1_output_0", "/blocks.10/self_attn/Unsqueeze_8_output_0", "/blocks.10/self_attn/Slice_2_output_0", "/blocks.10/self_attn/Concat_4_output_0", "/blocks.10/self_attn/Mul_3_output_0", "/blocks.10/self_attn/Add_1_output_0", "/blocks.10/self_attn/v_proj/FakeLinear_output_0", "/blocks.10/self_attn/Unsqueeze_4_output_0", "/blocks.10/self_attn/Unsqueeze_5_output_0", "/blocks.10/self_attn/Concat_2_output_0", "/blocks.10/self_attn/Reshape_2_output_0", "/blocks.10/self_attn/Reshape_7_output_0", "/blocks.10/self_attn/o_proj/FakeLinear_output_0", "/blocks.10/Add_output_0", "/blocks.10/post_attention_layernorm/Mul_1_output_0", "/blocks.10/mlp/gate_proj/FakeLinear_output_0", "/blocks.10/mlp/act_fn/Mul_output_0", "/blocks.10/mlp/up_proj/FakeLinear_output_0", "/blocks.10/mlp/Mul_output_0", "/blocks.10/mlp/down_proj/FakeLinear_output_0", "/blocks.10/Add_1_output_0", "/blocks.11/Reshape_output_0", "/blocks.11/input_layernorm/Mul_1_output_0", "/blocks.11/self_attn/q_proj/FakeLinear_output_0", "/blocks.11/self_attn/Shape_output_0", "Shape4712", "Rank4714", "BinaryOp4716", "Unsqueeze4717", "BinaryOp4719", "Unsqueeze4720", "StridedSlice4723", "Squeeze4724", "BinaryOp4726", "/blocks.11/self_attn/Gather_output_0", "/blocks.11/self_attn/Unsqueeze_output_0", "Unsqueeze4734", "Unsqueeze4737", "StridedSlice4740", "Squeeze4741", "BinaryOp4742", "BinaryOp4743", "/blocks.11/self_attn/Gather_1_output_0", "/blocks.11/self_attn/Unsqueeze_1_output_0", "/blocks.11/self_attn/Concat_output_0", "/blocks.11/self_attn/Reshape_output_0", "/blocks.11/self_attn/q_norm/Cast_output_0", "/blocks.11/self_attn/q_norm/Mul_1_output_0", "Unsqueeze4761", "Unsqueeze4764", "StridedSlice4767", "Squeeze4768", "BinaryOp4770", "/blocks.11/self_attn/Gather_2_output_0", "/blocks.11/self_attn/Mul_output_0", "/blocks.11/self_attn/Shape_2_output_0", "Shape4894", "Rank4896", "BinaryOp4898", "Unsqueeze4899", "BinaryOp4901", "Unsqueeze4902", "StridedSlice4905", "Squeeze4906", "BinaryOp4907", "BinaryOp4908", "/blocks.11/self_attn/Gather_4_output_0", "/blocks.11/self_attn/Div_output_0", "/blocks.11/self_attn/Unsqueeze_7_output_0", "/blocks.11/self_attn/Slice_1_output_0", "/blocks.11/self_attn/Neg_output_0", "/blocks.11/self_attn/Unsqueeze_6_output_0", "/blocks.11/self_attn/Slice_output_0", "/blocks.11/self_attn/Concat_3_output_0", "Unsqueeze4803", "Unsqueeze4806", "StridedSlice4809", "Squeeze4810", "BinaryOp4811", "BinaryOp4812", "/blocks.11/self_attn/Gather_3_output_0", "/blocks.11/self_attn/Mul_1_output_0", "/blocks.11/self_attn/Add_output_0", "/blocks.11/self_attn/k_proj/FakeLinear_output_0", "/blocks.11/self_attn/Unsqueeze_2_output_0", "/blocks.11/self_attn/Unsqueeze_3_output_0", "/blocks.11/self_attn/Concat_1_output_0", "/blocks.11/self_attn/Reshape_1_output_0", "/blocks.11/self_attn/k_norm/Cast_output_0", "/blocks.11/self_attn/k_norm/Mul_1_output_0", "/blocks.11/self_attn/Mul_2_output_0", "/blocks.11/self_attn/Shape_3_output_0", "Shape4774", "Rank4776", "BinaryOp4778", "Unsqueeze4779", "BinaryOp4781", "Unsqueeze4782", "StridedSlice4785", "Squeeze4786", "BinaryOp4787", "BinaryOp4788", "/blocks.11/self_attn/Gather_5_output_0", "/blocks.11/self_attn/Div_1_output_0", "/blocks.11/self_attn/Unsqueeze_9_output_0", "/blocks.11/self_attn/Slice_3_output_0", "/blocks.11/self_attn/Neg_1_output_0", "/blocks.11/self_attn/Unsqueeze_8_output_0", "/blocks.11/self_attn/Slice_2_output_0", "/blocks.11/self_attn/Concat_4_output_0", "/blocks.11/self_attn/Mul_3_output_0", "/blocks.11/self_attn/Add_1_output_0", "/blocks.11/self_attn/v_proj/FakeLinear_output_0", "/blocks.11/self_attn/Unsqueeze_4_output_0", "/blocks.11/self_attn/Unsqueeze_5_output_0", "/blocks.11/self_attn/Concat_2_output_0", "/blocks.11/self_attn/Reshape_2_output_0", "/blocks.11/self_attn/Reshape_7_output_0", "/blocks.11/self_attn/o_proj/FakeLinear_output_0", "/blocks.11/Add_output_0", "/blocks.11/post_attention_layernorm/Mul_1_output_0", "/blocks.11/mlp/gate_proj/FakeLinear_output_0", "/blocks.11/mlp/act_fn/Mul_output_0", "/blocks.11/mlp/up_proj/FakeLinear_output_0", "/blocks.11/mlp/Mul_output_0", "/blocks.11/mlp/down_proj/FakeLinear_output_0", "/blocks.11/Add_1_output_0", "/blocks.12/Reshape_output_0", "/blocks.12/input_layernorm/Mul_1_output_0", "/blocks.12/self_attn/q_proj/FakeLinear_output_0", "/blocks.12/self_attn/Shape_output_0", "Shape5133", "Rank5135", "BinaryOp5137", "Unsqueeze5138", "BinaryOp5140", "Unsqueeze5141", "StridedSlice5144", "Squeeze5145", "BinaryOp5147", "/blocks.12/self_attn/Gather_output_0", "/blocks.12/self_attn/Unsqueeze_output_0", "Unsqueeze5155", "Unsqueeze5158", "StridedSlice5161", "Squeeze5162", "BinaryOp5163", "BinaryOp5164", "/blocks.12/self_attn/Gather_1_output_0", "/blocks.12/self_attn/Unsqueeze_1_output_0", "/blocks.12/self_attn/Concat_output_0", "/blocks.12/self_attn/Reshape_output_0", "/blocks.12/self_attn/q_norm/Cast_output_0", "/blocks.12/self_attn/q_norm/Mul_1_output_0", "Unsqueeze5182", "Unsqueeze5185", "StridedSlice5188", "Squeeze5189", "BinaryOp5191", "/blocks.12/self_attn/Gather_2_output_0", "/blocks.12/self_attn/Mul_output_0", "/blocks.12/self_attn/Shape_2_output_0", "Shape5315", "Rank5317", "BinaryOp5319", "Unsqueeze5320", "BinaryOp5322", "Unsqueeze5323", "StridedSlice5326", "Squeeze5327", "BinaryOp5328", "BinaryOp5329", "/blocks.12/self_attn/Gather_4_output_0", "/blocks.12/self_attn/Div_output_0", "/blocks.12/self_attn/Unsqueeze_7_output_0", "/blocks.12/self_attn/Slice_1_output_0", "/blocks.12/self_attn/Neg_output_0", "/blocks.12/self_attn/Unsqueeze_6_output_0", "/blocks.12/self_attn/Slice_output_0", "/blocks.12/self_attn/Concat_3_output_0", "Unsqueeze5224", "Unsqueeze5227", "StridedSlice5230", "Squeeze5231", "BinaryOp5232", "BinaryOp5233", "/blocks.12/self_attn/Gather_3_output_0", "/blocks.12/self_attn/Mul_1_output_0", "/blocks.12/self_attn/Add_output_0", "/blocks.12/self_attn/k_proj/FakeLinear_output_0", "/blocks.12/self_attn/Unsqueeze_2_output_0", "/blocks.12/self_attn/Unsqueeze_3_output_0", "/blocks.12/self_attn/Concat_1_output_0", "/blocks.12/self_attn/Reshape_1_output_0", "/blocks.12/self_attn/k_norm/Cast_output_0", "/blocks.12/self_attn/k_norm/Mul_1_output_0", "/blocks.12/self_attn/Mul_2_output_0", "/blocks.12/self_attn/Shape_3_output_0", "Shape5195", "Rank5197", "BinaryOp5199", "Unsqueeze5200", "BinaryOp5202", "Unsqueeze5203", "StridedSlice5206", "Squeeze5207", "BinaryOp5208", "BinaryOp5209", "/blocks.12/self_attn/Gather_5_output_0", "/blocks.12/self_attn/Div_1_output_0", "/blocks.12/self_attn/Unsqueeze_9_output_0", "/blocks.12/self_attn/Slice_3_output_0", "/blocks.12/self_attn/Neg_1_output_0", "/blocks.12/self_attn/Unsqueeze_8_output_0", "/blocks.12/self_attn/Slice_2_output_0", "/blocks.12/self_attn/Concat_4_output_0", "/blocks.12/self_attn/Mul_3_output_0", "/blocks.12/self_attn/Add_1_output_0", "/blocks.12/self_attn/v_proj/FakeLinear_output_0", "/blocks.12/self_attn/Unsqueeze_4_output_0", "/blocks.12/self_attn/Unsqueeze_5_output_0", "/blocks.12/self_attn/Concat_2_output_0", "/blocks.12/self_attn/Reshape_2_output_0", "/blocks.12/self_attn/Reshape_7_output_0", "/blocks.12/self_attn/o_proj/FakeLinear_output_0", "/blocks.12/Add_output_0", "/blocks.12/post_attention_layernorm/Mul_1_output_0", "/blocks.12/mlp/gate_proj/FakeLinear_output_0", "/blocks.12/mlp/act_fn/Mul_output_0", "/blocks.12/mlp/up_proj/FakeLinear_output_0", "/blocks.12/mlp/Mul_output_0", "/blocks.12/mlp/down_proj/FakeLinear_output_0", "/blocks.12/Add_1_output_0", "/blocks.13/Reshape_output_0", "/blocks.13/input_layernorm/Mul_1_output_0", "/blocks.13/self_attn/q_proj/FakeLinear_output_0", "/blocks.13/self_attn/Shape_output_0", "Shape5554", "Rank5556", "BinaryOp5558", "Unsqueeze5559", "BinaryOp5561", "Unsqueeze5562", "StridedSlice5565", "Squeeze5566", "BinaryOp5568", "/blocks.13/self_attn/Gather_output_0", "/blocks.13/self_attn/Unsqueeze_output_0", "Unsqueeze5576", "Unsqueeze5579", "StridedSlice5582", "Squeeze5583", "BinaryOp5584", "BinaryOp5585", "/blocks.13/self_attn/Gather_1_output_0", "/blocks.13/self_attn/Unsqueeze_1_output_0", "/blocks.13/self_attn/Concat_output_0", "/blocks.13/self_attn/Reshape_output_0", "/blocks.13/self_attn/q_norm/Cast_output_0", "/blocks.13/self_attn/q_norm/Mul_1_output_0", "Unsqueeze5603", "Unsqueeze5606", "StridedSlice5609", "Squeeze5610", "BinaryOp5612", "/blocks.13/self_attn/Gather_2_output_0", "/blocks.13/self_attn/Mul_output_0", "/blocks.13/self_attn/Shape_2_output_0", "Shape5736", "Rank5738", "BinaryOp5740", "Unsqueeze5741", "BinaryOp5743", "Unsqueeze5744", "StridedSlice5747", "Squeeze5748", "BinaryOp5749", "BinaryOp5750", "/blocks.13/self_attn/Gather_4_output_0", "/blocks.13/self_attn/Div_output_0", "/blocks.13/self_attn/Unsqueeze_7_output_0", "/blocks.13/self_attn/Slice_1_output_0", "/blocks.13/self_attn/Neg_output_0", "/blocks.13/self_attn/Unsqueeze_6_output_0", "/blocks.13/self_attn/Slice_output_0", "/blocks.13/self_attn/Concat_3_output_0", "Unsqueeze5645", "Unsqueeze5648", "StridedSlice5651", "Squeeze5652", "BinaryOp5653", "BinaryOp5654", "/blocks.13/self_attn/Gather_3_output_0", "/blocks.13/self_attn/Mul_1_output_0", "/blocks.13/self_attn/Add_output_0", "/blocks.13/self_attn/k_proj/FakeLinear_output_0", "/blocks.13/self_attn/Unsqueeze_2_output_0", "/blocks.13/self_attn/Unsqueeze_3_output_0", "/blocks.13/self_attn/Concat_1_output_0", "/blocks.13/self_attn/Reshape_1_output_0", "/blocks.13/self_attn/k_norm/Cast_output_0", "/blocks.13/self_attn/k_norm/Mul_1_output_0", "/blocks.13/self_attn/Mul_2_output_0", "/blocks.13/self_attn/Shape_3_output_0", "Shape5616", "Rank5618", "BinaryOp5620", "Unsqueeze5621", "BinaryOp5623", "Unsqueeze5624", "StridedSlice5627", "Squeeze5628", "BinaryOp5629", "BinaryOp5630", "/blocks.13/self_attn/Gather_5_output_0", "/blocks.13/self_attn/Div_1_output_0", "/blocks.13/self_attn/Unsqueeze_9_output_0", "/blocks.13/self_attn/Slice_3_output_0", "/blocks.13/self_attn/Neg_1_output_0", "/blocks.13/self_attn/Unsqueeze_8_output_0", "/blocks.13/self_attn/Slice_2_output_0", "/blocks.13/self_attn/Concat_4_output_0", "/blocks.13/self_attn/Mul_3_output_0", "/blocks.13/self_attn/Add_1_output_0", "/blocks.13/self_attn/v_proj/FakeLinear_output_0", "/blocks.13/self_attn/Unsqueeze_4_output_0", "/blocks.13/self_attn/Unsqueeze_5_output_0", "/blocks.13/self_attn/Concat_2_output_0", "/blocks.13/self_attn/Reshape_2_output_0", "/blocks.13/self_attn/Reshape_7_output_0", "/blocks.13/self_attn/o_proj/FakeLinear_output_0", "/blocks.13/Add_output_0", "/blocks.13/post_attention_layernorm/Mul_1_output_0", "/blocks.13/mlp/gate_proj/FakeLinear_output_0", "/blocks.13/mlp/act_fn/Mul_output_0", "/blocks.13/mlp/up_proj/FakeLinear_output_0", "/blocks.13/mlp/Mul_output_0", "/blocks.13/mlp/down_proj/FakeLinear_output_0", "/blocks.13/Add_1_output_0", "/blocks.14/Reshape_output_0", "/blocks.14/input_layernorm/Mul_1_output_0", "/blocks.14/self_attn/q_proj/FakeLinear_output_0", "/blocks.14/self_attn/Shape_output_0", "Shape5975", "Rank5977", "BinaryOp5979", "Unsqueeze5980", "BinaryOp5982", "Unsqueeze5983", "StridedSlice5986", "Squeeze5987", "BinaryOp5989", "/blocks.14/self_attn/Gather_output_0", "/blocks.14/self_attn/Unsqueeze_output_0", "Unsqueeze5997", "Unsqueeze6000", "StridedSlice6003", "Squeeze6004", "BinaryOp6005", "BinaryOp6006", "/blocks.14/self_attn/Gather_1_output_0", "/blocks.14/self_attn/Unsqueeze_1_output_0", "/blocks.14/self_attn/Concat_output_0", "/blocks.14/self_attn/Reshape_output_0", "/blocks.14/self_attn/q_norm/Cast_output_0", "/blocks.14/self_attn/q_norm/Mul_1_output_0", "Unsqueeze6024", "Unsqueeze6027", "StridedSlice6030", "Squeeze6031", "BinaryOp6033", "/blocks.14/self_attn/Gather_2_output_0", "/blocks.14/self_attn/Mul_output_0", "/blocks.14/self_attn/Shape_2_output_0", "Shape6157", "Rank6159", "BinaryOp6161", "Unsqueeze6162", "BinaryOp6164", "Unsqueeze6165", "StridedSlice6168", "Squeeze6169", "BinaryOp6170", "BinaryOp6171", "/blocks.14/self_attn/Gather_4_output_0", "/blocks.14/self_attn/Div_output_0", "/blocks.14/self_attn/Unsqueeze_7_output_0", "/blocks.14/self_attn/Slice_1_output_0", "/blocks.14/self_attn/Neg_output_0", "/blocks.14/self_attn/Unsqueeze_6_output_0", "/blocks.14/self_attn/Slice_output_0", "/blocks.14/self_attn/Concat_3_output_0", "Unsqueeze6066", "Unsqueeze6069", "StridedSlice6072", "Squeeze6073", "BinaryOp6074", "BinaryOp6075", "/blocks.14/self_attn/Gather_3_output_0", "/blocks.14/self_attn/Mul_1_output_0", "/blocks.14/self_attn/Add_output_0", "/blocks.14/self_attn/k_proj/FakeLinear_output_0", "/blocks.14/self_attn/Unsqueeze_2_output_0", "/blocks.14/self_attn/Unsqueeze_3_output_0", "/blocks.14/self_attn/Concat_1_output_0", "/blocks.14/self_attn/Reshape_1_output_0", "/blocks.14/self_attn/k_norm/Cast_output_0", "/blocks.14/self_attn/k_norm/Mul_1_output_0", "/blocks.14/self_attn/Mul_2_output_0", "/blocks.14/self_attn/Shape_3_output_0", "Shape6037", "Rank6039", "BinaryOp6041", "Unsqueeze6042", "BinaryOp6044", "Unsqueeze6045", "StridedSlice6048", "Squeeze6049", "BinaryOp6050", "BinaryOp6051", "/blocks.14/self_attn/Gather_5_output_0", "/blocks.14/self_attn/Div_1_output_0", "/blocks.14/self_attn/Unsqueeze_9_output_0", "/blocks.14/self_attn/Slice_3_output_0", "/blocks.14/self_attn/Neg_1_output_0", "/blocks.14/self_attn/Unsqueeze_8_output_0", "/blocks.14/self_attn/Slice_2_output_0", "/blocks.14/self_attn/Concat_4_output_0", "/blocks.14/self_attn/Mul_3_output_0", "/blocks.14/self_attn/Add_1_output_0", "/blocks.14/self_attn/v_proj/FakeLinear_output_0", "/blocks.14/self_attn/Unsqueeze_4_output_0", "/blocks.14/self_attn/Unsqueeze_5_output_0", "/blocks.14/self_attn/Concat_2_output_0", "/blocks.14/self_attn/Reshape_2_output_0", "/blocks.14/self_attn/Reshape_7_output_0", "/blocks.14/self_attn/o_proj/FakeLinear_output_0", "/blocks.14/Add_output_0", "/blocks.14/post_attention_layernorm/Mul_1_output_0", "/blocks.14/mlp/gate_proj/FakeLinear_output_0", "/blocks.14/mlp/act_fn/Mul_output_0", "/blocks.14/mlp/up_proj/FakeLinear_output_0", "/blocks.14/mlp/Mul_output_0", "/blocks.14/mlp/down_proj/FakeLinear_output_0", "/blocks.14/Add_1_output_0", "/blocks.15/Reshape_output_0", "/blocks.15/input_layernorm/Mul_1_output_0", "/blocks.15/self_attn/q_proj/FakeLinear_output_0", "/blocks.15/self_attn/Shape_output_0", "Shape6396", "Rank6398", "BinaryOp6400", "Unsqueeze6401", "BinaryOp6403", "Unsqueeze6404", "StridedSlice6407", "Squeeze6408", "BinaryOp6410", "/blocks.15/self_attn/Gather_output_0", "/blocks.15/self_attn/Unsqueeze_output_0", "Unsqueeze6418", "Unsqueeze6421", "StridedSlice6424", "Squeeze6425", "BinaryOp6426", "BinaryOp6427", "/blocks.15/self_attn/Gather_1_output_0", "/blocks.15/self_attn/Unsqueeze_1_output_0", "/blocks.15/self_attn/Concat_output_0", "/blocks.15/self_attn/Reshape_output_0", "/blocks.15/self_attn/q_norm/Cast_output_0", "/blocks.15/self_attn/q_norm/Mul_1_output_0", "Unsqueeze6445", "Unsqueeze6448", "StridedSlice6451", "Squeeze6452", "BinaryOp6454", "/blocks.15/self_attn/Gather_2_output_0", "/blocks.15/self_attn/Mul_output_0", "/blocks.15/self_attn/Shape_2_output_0", "Shape6578", "Rank6580", "BinaryOp6582", "Unsqueeze6583", "BinaryOp6585", "Unsqueeze6586", "StridedSlice6589", "Squeeze6590", "BinaryOp6591", "BinaryOp6592", "/blocks.15/self_attn/Gather_4_output_0", "/blocks.15/self_attn/Div_output_0", "/blocks.15/self_attn/Unsqueeze_7_output_0", "/blocks.15/self_attn/Slice_1_output_0", "/blocks.15/self_attn/Neg_output_0", "/blocks.15/self_attn/Unsqueeze_6_output_0", "/blocks.15/self_attn/Slice_output_0", "/blocks.15/self_attn/Concat_3_output_0", "Unsqueeze6487", "Unsqueeze6490", "StridedSlice6493", "Squeeze6494", "BinaryOp6495", "BinaryOp6496", "/blocks.15/self_attn/Gather_3_output_0", "/blocks.15/self_attn/Mul_1_output_0", "/blocks.15/self_attn/Add_output_0", "/blocks.15/self_attn/k_proj/FakeLinear_output_0", "/blocks.15/self_attn/Unsqueeze_2_output_0", "/blocks.15/self_attn/Unsqueeze_3_output_0", "/blocks.15/self_attn/Concat_1_output_0", "/blocks.15/self_attn/Reshape_1_output_0", "/blocks.15/self_attn/k_norm/Cast_output_0", "/blocks.15/self_attn/k_norm/Mul_1_output_0", "/blocks.15/self_attn/Mul_2_output_0", "/blocks.15/self_attn/Shape_3_output_0", "Shape6458", "Rank6460", "BinaryOp6462", "Unsqueeze6463", "BinaryOp6465", "Unsqueeze6466", "StridedSlice6469", "Squeeze6470", "BinaryOp6471", "BinaryOp6472", "/blocks.15/self_attn/Gather_5_output_0", "/blocks.15/self_attn/Div_1_output_0", "/blocks.15/self_attn/Unsqueeze_9_output_0", "/blocks.15/self_attn/Slice_3_output_0", "/blocks.15/self_attn/Neg_1_output_0", "/blocks.15/self_attn/Unsqueeze_8_output_0", "/blocks.15/self_attn/Slice_2_output_0", "/blocks.15/self_attn/Concat_4_output_0", "/blocks.15/self_attn/Mul_3_output_0", "/blocks.15/self_attn/Add_1_output_0", "/blocks.15/self_attn/v_proj/FakeLinear_output_0", "/blocks.15/self_attn/Unsqueeze_4_output_0", "/blocks.15/self_attn/Unsqueeze_5_output_0", "/blocks.15/self_attn/Concat_2_output_0", "/blocks.15/self_attn/Reshape_2_output_0", "/blocks.15/self_attn/Reshape_7_output_0", "/blocks.15/self_attn/o_proj/FakeLinear_output_0", "/blocks.15/Add_output_0", "/blocks.15/post_attention_layernorm/Mul_1_output_0", "/blocks.15/mlp/gate_proj/FakeLinear_output_0", "/blocks.15/mlp/act_fn/Mul_output_0", "/blocks.15/mlp/up_proj/FakeLinear_output_0", "/blocks.15/mlp/Mul_output_0", "/blocks.15/mlp/down_proj/FakeLinear_output_0", "/blocks.15/Add_1_output_0", "/blocks.16/Reshape_output_0", "/blocks.16/input_layernorm/Mul_1_output_0", "/blocks.16/self_attn/q_proj/FakeLinear_output_0", "/blocks.16/self_attn/Shape_output_0", "Shape6817", "Rank6819", "BinaryOp6821", "Unsqueeze6822", "BinaryOp6824", "Unsqueeze6825", "StridedSlice6828", "Squeeze6829", "BinaryOp6831", "/blocks.16/self_attn/Gather_output_0", "/blocks.16/self_attn/Unsqueeze_output_0", "Unsqueeze6839", "Unsqueeze6842", "StridedSlice6845", "Squeeze6846", "BinaryOp6847", "BinaryOp6848", "/blocks.16/self_attn/Gather_1_output_0", "/blocks.16/self_attn/Unsqueeze_1_output_0", "/blocks.16/self_attn/Concat_output_0", "/blocks.16/self_attn/Reshape_output_0", "/blocks.16/self_attn/q_norm/Cast_output_0", "/blocks.16/self_attn/q_norm/Mul_1_output_0", "Unsqueeze6866", "Unsqueeze6869", "StridedSlice6872", "Squeeze6873", "BinaryOp6875", "/blocks.16/self_attn/Gather_2_output_0", "/blocks.16/self_attn/Mul_output_0", "/blocks.16/self_attn/Shape_2_output_0", "Shape6999", "Rank7001", "BinaryOp7003", "Unsqueeze7004", "BinaryOp7006", "Unsqueeze7007", "StridedSlice7010", "Squeeze7011", "BinaryOp7012", "BinaryOp7013", "/blocks.16/self_attn/Gather_4_output_0", "/blocks.16/self_attn/Div_output_0", "/blocks.16/self_attn/Unsqueeze_7_output_0", "/blocks.16/self_attn/Slice_1_output_0", "/blocks.16/self_attn/Neg_output_0", "/blocks.16/self_attn/Unsqueeze_6_output_0", "/blocks.16/self_attn/Slice_output_0", "/blocks.16/self_attn/Concat_3_output_0", "Unsqueeze6908", "Unsqueeze6911", "StridedSlice6914", "Squeeze6915", "BinaryOp6916", "BinaryOp6917", "/blocks.16/self_attn/Gather_3_output_0", "/blocks.16/self_attn/Mul_1_output_0", "/blocks.16/self_attn/Add_output_0", "/blocks.16/self_attn/k_proj/FakeLinear_output_0", "/blocks.16/self_attn/Unsqueeze_2_output_0", "/blocks.16/self_attn/Unsqueeze_3_output_0", "/blocks.16/self_attn/Concat_1_output_0", "/blocks.16/self_attn/Reshape_1_output_0", "/blocks.16/self_attn/k_norm/Cast_output_0", "/blocks.16/self_attn/k_norm/Mul_1_output_0", "/blocks.16/self_attn/Mul_2_output_0", "/blocks.16/self_attn/Shape_3_output_0", "Shape6879", "Rank6881", "BinaryOp6883", "Unsqueeze6884", "BinaryOp6886", "Unsqueeze6887", "StridedSlice6890", "Squeeze6891", "BinaryOp6892", "BinaryOp6893", "/blocks.16/self_attn/Gather_5_output_0", "/blocks.16/self_attn/Div_1_output_0", "/blocks.16/self_attn/Unsqueeze_9_output_0", "/blocks.16/self_attn/Slice_3_output_0", "/blocks.16/self_attn/Neg_1_output_0", "/blocks.16/self_attn/Unsqueeze_8_output_0", "/blocks.16/self_attn/Slice_2_output_0", "/blocks.16/self_attn/Concat_4_output_0", "/blocks.16/self_attn/Mul_3_output_0", "/blocks.16/self_attn/Add_1_output_0", "/blocks.16/self_attn/v_proj/FakeLinear_output_0", "/blocks.16/self_attn/Unsqueeze_4_output_0", "/blocks.16/self_attn/Unsqueeze_5_output_0", "/blocks.16/self_attn/Concat_2_output_0", "/blocks.16/self_attn/Reshape_2_output_0", "/blocks.16/self_attn/Reshape_7_output_0", "/blocks.16/self_attn/o_proj/FakeLinear_output_0", "/blocks.16/Add_output_0", "/blocks.16/post_attention_layernorm/Mul_1_output_0", "/blocks.16/mlp/gate_proj/FakeLinear_output_0", "/blocks.16/mlp/act_fn/Mul_output_0", "/blocks.16/mlp/up_proj/FakeLinear_output_0", "/blocks.16/mlp/Mul_output_0", "/blocks.16/mlp/down_proj/FakeLinear_output_0", "/blocks.16/Add_1_output_0", "/blocks.17/Reshape_output_0", "/blocks.17/input_layernorm/Mul_1_output_0", "/blocks.17/self_attn/q_proj/FakeLinear_output_0", "/blocks.17/self_attn/Shape_output_0", "Shape7238", "Rank7240", "BinaryOp7242", "Unsqueeze7243", "BinaryOp7245", "Unsqueeze7246", "StridedSlice7249", "Squeeze7250", "BinaryOp7252", "/blocks.17/self_attn/Gather_output_0", "/blocks.17/self_attn/Unsqueeze_output_0", "Unsqueeze7260", "Unsqueeze7263", "StridedSlice7266", "Squeeze7267", "BinaryOp7268", "BinaryOp7269", "/blocks.17/self_attn/Gather_1_output_0", "/blocks.17/self_attn/Unsqueeze_1_output_0", "/blocks.17/self_attn/Concat_output_0", "/blocks.17/self_attn/Reshape_output_0", "/blocks.17/self_attn/q_norm/Cast_output_0", "/blocks.17/self_attn/q_norm/Mul_1_output_0", "Unsqueeze7287", "Unsqueeze7290", "StridedSlice7293", "Squeeze7294", "BinaryOp7296", "/blocks.17/self_attn/Gather_2_output_0", "/blocks.17/self_attn/Mul_output_0", "/blocks.17/self_attn/Shape_2_output_0", "Shape7420", "Rank7422", "BinaryOp7424", "Unsqueeze7425", "BinaryOp7427", "Unsqueeze7428", "StridedSlice7431", "Squeeze7432", "BinaryOp7433", "BinaryOp7434", "/blocks.17/self_attn/Gather_4_output_0", "/blocks.17/self_attn/Div_output_0", "/blocks.17/self_attn/Unsqueeze_7_output_0", "/blocks.17/self_attn/Slice_1_output_0", "/blocks.17/self_attn/Neg_output_0", "/blocks.17/self_attn/Unsqueeze_6_output_0", "/blocks.17/self_attn/Slice_output_0", "/blocks.17/self_attn/Concat_3_output_0", "Unsqueeze7329", "Unsqueeze7332", "StridedSlice7335", "Squeeze7336", "BinaryOp7337", "BinaryOp7338", "/blocks.17/self_attn/Gather_3_output_0", "/blocks.17/self_attn/Mul_1_output_0", "/blocks.17/self_attn/Add_output_0", "/blocks.17/self_attn/k_proj/FakeLinear_output_0", "/blocks.17/self_attn/Unsqueeze_2_output_0", "/blocks.17/self_attn/Unsqueeze_3_output_0", "/blocks.17/self_attn/Concat_1_output_0", "/blocks.17/self_attn/Reshape_1_output_0", "/blocks.17/self_attn/k_norm/Cast_output_0", "/blocks.17/self_attn/k_norm/Mul_1_output_0", "/blocks.17/self_attn/Mul_2_output_0", "/blocks.17/self_attn/Shape_3_output_0", "Shape7300", "Rank7302", "BinaryOp7304", "Unsqueeze7305", "BinaryOp7307", "Unsqueeze7308", "StridedSlice7311", "Squeeze7312", "BinaryOp7313", "BinaryOp7314", "/blocks.17/self_attn/Gather_5_output_0", "/blocks.17/self_attn/Div_1_output_0", "/blocks.17/self_attn/Unsqueeze_9_output_0", "/blocks.17/self_attn/Slice_3_output_0", "/blocks.17/self_attn/Neg_1_output_0", "/blocks.17/self_attn/Unsqueeze_8_output_0", "/blocks.17/self_attn/Slice_2_output_0", "/blocks.17/self_attn/Concat_4_output_0", "/blocks.17/self_attn/Mul_3_output_0", "/blocks.17/self_attn/Add_1_output_0", "/blocks.17/self_attn/v_proj/FakeLinear_output_0", "/blocks.17/self_attn/Unsqueeze_4_output_0", "/blocks.17/self_attn/Unsqueeze_5_output_0", "/blocks.17/self_attn/Concat_2_output_0", "/blocks.17/self_attn/Reshape_2_output_0", "/blocks.17/self_attn/Reshape_7_output_0", "/blocks.17/self_attn/o_proj/FakeLinear_output_0", "/blocks.17/Add_output_0", "/blocks.17/post_attention_layernorm/Mul_1_output_0", "/blocks.17/mlp/gate_proj/FakeLinear_output_0", "/blocks.17/mlp/act_fn/Mul_output_0", "/blocks.17/mlp/up_proj/FakeLinear_output_0", "/blocks.17/mlp/Mul_output_0", "/blocks.17/mlp/down_proj/FakeLinear_output_0", "/blocks.17/Add_1_output_0", "/blocks.18/Reshape_output_0", "/blocks.18/input_layernorm/Mul_1_output_0", "/blocks.18/self_attn/q_proj/FakeLinear_output_0", "/blocks.18/self_attn/Shape_output_0", "Shape7659", "Rank7661", "BinaryOp7663", "Unsqueeze7664", "BinaryOp7666", "Unsqueeze7667", "StridedSlice7670", "Squeeze7671", "BinaryOp7673", "/blocks.18/self_attn/Gather_output_0", "/blocks.18/self_attn/Unsqueeze_output_0", "Unsqueeze7681", "Unsqueeze7684", "StridedSlice7687", "Squeeze7688", "BinaryOp7689", "BinaryOp7690", "/blocks.18/self_attn/Gather_1_output_0", "/blocks.18/self_attn/Unsqueeze_1_output_0", "/blocks.18/self_attn/Concat_output_0", "/blocks.18/self_attn/Reshape_output_0", "/blocks.18/self_attn/q_norm/Cast_output_0", "/blocks.18/self_attn/q_norm/Mul_1_output_0", "Unsqueeze7708", "Unsqueeze7711", "StridedSlice7714", "Squeeze7715", "BinaryOp7717", "/blocks.18/self_attn/Gather_2_output_0", "/blocks.18/self_attn/Mul_output_0", "/blocks.18/self_attn/Shape_2_output_0", "Shape7841", "Rank7843", "BinaryOp7845", "Unsqueeze7846", "BinaryOp7848", "Unsqueeze7849", "StridedSlice7852", "Squeeze7853", "BinaryOp7854", "BinaryOp7855", "/blocks.18/self_attn/Gather_4_output_0", "/blocks.18/self_attn/Div_output_0", "/blocks.18/self_attn/Unsqueeze_7_output_0", "/blocks.18/self_attn/Slice_1_output_0", "/blocks.18/self_attn/Neg_output_0", "/blocks.18/self_attn/Unsqueeze_6_output_0", "/blocks.18/self_attn/Slice_output_0", "/blocks.18/self_attn/Concat_3_output_0", "Unsqueeze7750", "Unsqueeze7753", "StridedSlice7756", "Squeeze7757", "BinaryOp7758", "BinaryOp7759", "/blocks.18/self_attn/Gather_3_output_0", "/blocks.18/self_attn/Mul_1_output_0", "/blocks.18/self_attn/Add_output_0", "/blocks.18/self_attn/k_proj/FakeLinear_output_0", "/blocks.18/self_attn/Unsqueeze_2_output_0", "/blocks.18/self_attn/Unsqueeze_3_output_0", "/blocks.18/self_attn/Concat_1_output_0", "/blocks.18/self_attn/Reshape_1_output_0", "/blocks.18/self_attn/k_norm/Cast_output_0", "/blocks.18/self_attn/k_norm/Mul_1_output_0", "/blocks.18/self_attn/Mul_2_output_0", "/blocks.18/self_attn/Shape_3_output_0", "Shape7721", "Rank7723", "BinaryOp7725", "Unsqueeze7726", "BinaryOp7728", "Unsqueeze7729", "StridedSlice7732", "Squeeze7733", "BinaryOp7734", "BinaryOp7735", "/blocks.18/self_attn/Gather_5_output_0", "/blocks.18/self_attn/Div_1_output_0", "/blocks.18/self_attn/Unsqueeze_9_output_0", "/blocks.18/self_attn/Slice_3_output_0", "/blocks.18/self_attn/Neg_1_output_0", "/blocks.18/self_attn/Unsqueeze_8_output_0", "/blocks.18/self_attn/Slice_2_output_0", "/blocks.18/self_attn/Concat_4_output_0", "/blocks.18/self_attn/Mul_3_output_0", "/blocks.18/self_attn/Add_1_output_0", "/blocks.18/self_attn/v_proj/FakeLinear_output_0", "/blocks.18/self_attn/Unsqueeze_4_output_0", "/blocks.18/self_attn/Unsqueeze_5_output_0", "/blocks.18/self_attn/Concat_2_output_0", "/blocks.18/self_attn/Reshape_2_output_0", "/blocks.18/self_attn/Reshape_7_output_0", "/blocks.18/self_attn/o_proj/FakeLinear_output_0", "/blocks.18/Add_output_0", "/blocks.18/post_attention_layernorm/Mul_1_output_0", "/blocks.18/mlp/gate_proj/FakeLinear_output_0", "/blocks.18/mlp/act_fn/Mul_output_0", "/blocks.18/mlp/up_proj/FakeLinear_output_0", "/blocks.18/mlp/Mul_output_0", "/blocks.18/mlp/down_proj/FakeLinear_output_0", "/blocks.18/Add_1_output_0", "/blocks.19/Reshape_output_0", "/blocks.19/input_layernorm/Mul_1_output_0", "/blocks.19/self_attn/q_proj/FakeLinear_output_0", "/blocks.19/self_attn/Shape_output_0", "Shape8080", "Rank8082", "BinaryOp8084", "Unsqueeze8085", "BinaryOp8087", "Unsqueeze8088", "StridedSlice8091", "Squeeze8092", "BinaryOp8094", "/blocks.19/self_attn/Gather_output_0", "/blocks.19/self_attn/Unsqueeze_output_0", "Unsqueeze8102", "Unsqueeze8105", "StridedSlice8108", "Squeeze8109", "BinaryOp8110", "BinaryOp8111", "/blocks.19/self_attn/Gather_1_output_0", "/blocks.19/self_attn/Unsqueeze_1_output_0", "/blocks.19/self_attn/Concat_output_0", "/blocks.19/self_attn/Reshape_output_0", "/blocks.19/self_attn/q_norm/Cast_output_0", "/blocks.19/self_attn/q_norm/Mul_1_output_0", "Unsqueeze8129", "Unsqueeze8132", "StridedSlice8135", "Squeeze8136", "BinaryOp8138", "/blocks.19/self_attn/Gather_2_output_0", "/blocks.19/self_attn/Mul_output_0", "/blocks.19/self_attn/Shape_2_output_0", "Shape8262", "Rank8264", "BinaryOp8266", "Unsqueeze8267", "BinaryOp8269", "Unsqueeze8270", "StridedSlice8273", "Squeeze8274", "BinaryOp8275", "BinaryOp8276", "/blocks.19/self_attn/Gather_4_output_0", "/blocks.19/self_attn/Div_output_0", "/blocks.19/self_attn/Unsqueeze_7_output_0", "/blocks.19/self_attn/Slice_1_output_0", "/blocks.19/self_attn/Neg_output_0", "/blocks.19/self_attn/Unsqueeze_6_output_0", "/blocks.19/self_attn/Slice_output_0", "/blocks.19/self_attn/Concat_3_output_0", "Unsqueeze8171", "Unsqueeze8174", "StridedSlice8177", "Squeeze8178", "BinaryOp8179", "BinaryOp8180", "/blocks.19/self_attn/Gather_3_output_0", "/blocks.19/self_attn/Mul_1_output_0", "/blocks.19/self_attn/Add_output_0", "/blocks.19/self_attn/k_proj/FakeLinear_output_0", "/blocks.19/self_attn/Unsqueeze_2_output_0", "/blocks.19/self_attn/Unsqueeze_3_output_0", "/blocks.19/self_attn/Concat_1_output_0", "/blocks.19/self_attn/Reshape_1_output_0", "/blocks.19/self_attn/k_norm/Cast_output_0", "/blocks.19/self_attn/k_norm/Mul_1_output_0", "/blocks.19/self_attn/Mul_2_output_0", "/blocks.19/self_attn/Shape_3_output_0", "Shape8142", "Rank8144", "BinaryOp8146", "Unsqueeze8147", "BinaryOp8149", "Unsqueeze8150", "StridedSlice8153", "Squeeze8154", "BinaryOp8155", "BinaryOp8156", "/blocks.19/self_attn/Gather_5_output_0", "/blocks.19/self_attn/Div_1_output_0", "/blocks.19/self_attn/Unsqueeze_9_output_0", "/blocks.19/self_attn/Slice_3_output_0", "/blocks.19/self_attn/Neg_1_output_0", "/blocks.19/self_attn/Unsqueeze_8_output_0", "/blocks.19/self_attn/Slice_2_output_0", "/blocks.19/self_attn/Concat_4_output_0", "/blocks.19/self_attn/Mul_3_output_0", "/blocks.19/self_attn/Add_1_output_0", "/blocks.19/self_attn/v_proj/FakeLinear_output_0", "/blocks.19/self_attn/Unsqueeze_4_output_0", "/blocks.19/self_attn/Unsqueeze_5_output_0", "/blocks.19/self_attn/Concat_2_output_0", "/blocks.19/self_attn/Reshape_2_output_0", "/blocks.19/self_attn/Reshape_7_output_0", "/blocks.19/self_attn/o_proj/FakeLinear_output_0", "/blocks.19/Add_output_0", "/blocks.19/post_attention_layernorm/Mul_1_output_0", "/blocks.19/mlp/gate_proj/FakeLinear_output_0", "/blocks.19/mlp/act_fn/Mul_output_0", "/blocks.19/mlp/up_proj/FakeLinear_output_0", "/blocks.19/mlp/Mul_output_0", "/blocks.19/mlp/down_proj/FakeLinear_output_0", "/blocks.19/Add_1_output_0", "/blocks.20/Reshape_output_0", "/blocks.20/input_layernorm/Mul_1_output_0", "/blocks.20/self_attn/q_proj/FakeLinear_output_0", "/blocks.20/self_attn/Shape_output_0", "Shape8501", "Rank8503", "BinaryOp8505", "Unsqueeze8506", "BinaryOp8508", "Unsqueeze8509", "StridedSlice8512", "Squeeze8513", "BinaryOp8515", "/blocks.20/self_attn/Gather_output_0", "/blocks.20/self_attn/Unsqueeze_output_0", "Unsqueeze8523", "Unsqueeze8526", "StridedSlice8529", "Squeeze8530", "BinaryOp8531", "BinaryOp8532", "/blocks.20/self_attn/Gather_1_output_0", "/blocks.20/self_attn/Unsqueeze_1_output_0", "/blocks.20/self_attn/Concat_output_0", "/blocks.20/self_attn/Reshape_output_0", "/blocks.20/self_attn/q_norm/Cast_output_0", "/blocks.20/self_attn/q_norm/Mul_1_output_0", "Unsqueeze8550", "Unsqueeze8553", "StridedSlice8556", "Squeeze8557", "BinaryOp8559", "/blocks.20/self_attn/Gather_2_output_0", "/blocks.20/self_attn/Mul_output_0", "/blocks.20/self_attn/Shape_2_output_0", "Shape8683", "Rank8685", "BinaryOp8687", "Unsqueeze8688", "BinaryOp8690", "Unsqueeze8691", "StridedSlice8694", "Squeeze8695", "BinaryOp8696", "BinaryOp8697", "/blocks.20/self_attn/Gather_4_output_0", "/blocks.20/self_attn/Div_output_0", "/blocks.20/self_attn/Unsqueeze_7_output_0", "/blocks.20/self_attn/Slice_1_output_0", "/blocks.20/self_attn/Neg_output_0", "/blocks.20/self_attn/Unsqueeze_6_output_0", "/blocks.20/self_attn/Slice_output_0", "/blocks.20/self_attn/Concat_3_output_0", "Unsqueeze8592", "Unsqueeze8595", "StridedSlice8598", "Squeeze8599", "BinaryOp8600", "BinaryOp8601", "/blocks.20/self_attn/Gather_3_output_0", "/blocks.20/self_attn/Mul_1_output_0", "/blocks.20/self_attn/Add_output_0", "/blocks.20/self_attn/k_proj/FakeLinear_output_0", "/blocks.20/self_attn/Unsqueeze_2_output_0", "/blocks.20/self_attn/Unsqueeze_3_output_0", "/blocks.20/self_attn/Concat_1_output_0", "/blocks.20/self_attn/Reshape_1_output_0", "/blocks.20/self_attn/k_norm/Cast_output_0", "/blocks.20/self_attn/k_norm/Mul_1_output_0", "/blocks.20/self_attn/Mul_2_output_0", "/blocks.20/self_attn/Shape_3_output_0", "Shape8563", "Rank8565", "BinaryOp8567", "Unsqueeze8568", "BinaryOp8570", "Unsqueeze8571", "StridedSlice8574", "Squeeze8575", "BinaryOp8576", "BinaryOp8577", "/blocks.20/self_attn/Gather_5_output_0", "/blocks.20/self_attn/Div_1_output_0", "/blocks.20/self_attn/Unsqueeze_9_output_0", "/blocks.20/self_attn/Slice_3_output_0", "/blocks.20/self_attn/Neg_1_output_0", "/blocks.20/self_attn/Unsqueeze_8_output_0", "/blocks.20/self_attn/Slice_2_output_0", "/blocks.20/self_attn/Concat_4_output_0", "/blocks.20/self_attn/Mul_3_output_0", "/blocks.20/self_attn/Add_1_output_0", "/blocks.20/self_attn/v_proj/FakeLinear_output_0", "/blocks.20/self_attn/Unsqueeze_4_output_0", "/blocks.20/self_attn/Unsqueeze_5_output_0", "/blocks.20/self_attn/Concat_2_output_0", "/blocks.20/self_attn/Reshape_2_output_0", "/blocks.20/self_attn/Reshape_7_output_0", "/blocks.20/self_attn/o_proj/FakeLinear_output_0", "/blocks.20/Add_output_0", "/blocks.20/post_attention_layernorm/Mul_1_output_0", "/blocks.20/mlp/gate_proj/FakeLinear_output_0", "/blocks.20/mlp/act_fn/Mul_output_0", "/blocks.20/mlp/up_proj/FakeLinear_output_0", "/blocks.20/mlp/Mul_output_0", "/blocks.20/mlp/down_proj/FakeLinear_output_0", "/blocks.20/Add_1_output_0", "/blocks.21/Reshape_output_0", "/blocks.21/input_layernorm/Mul_1_output_0", "/blocks.21/self_attn/q_proj/FakeLinear_output_0", "/blocks.21/self_attn/Shape_output_0", "Shape8922", "Rank8924", "BinaryOp8926", "Unsqueeze8927", "BinaryOp8929", "Unsqueeze8930", "StridedSlice8933", "Squeeze8934", "BinaryOp8936", "/blocks.21/self_attn/Gather_output_0", "/blocks.21/self_attn/Unsqueeze_output_0", "Unsqueeze8944", "Unsqueeze8947", "StridedSlice8950", "Squeeze8951", "BinaryOp8952", "BinaryOp8953", "/blocks.21/self_attn/Gather_1_output_0", "/blocks.21/self_attn/Unsqueeze_1_output_0", "/blocks.21/self_attn/Concat_output_0", "/blocks.21/self_attn/Reshape_output_0", "/blocks.21/self_attn/q_norm/Cast_output_0", "/blocks.21/self_attn/q_norm/Mul_1_output_0", "Unsqueeze8971", "Unsqueeze8974", "StridedSlice8977", "Squeeze8978", "BinaryOp8980", "/blocks.21/self_attn/Gather_2_output_0", "/blocks.21/self_attn/Mul_output_0", "/blocks.21/self_attn/Shape_2_output_0", "Shape9104", "Rank9106", "BinaryOp9108", "Unsqueeze9109", "BinaryOp9111", "Unsqueeze9112", "StridedSlice9115", "Squeeze9116", "BinaryOp9117", "BinaryOp9118", "/blocks.21/self_attn/Gather_4_output_0", "/blocks.21/self_attn/Div_output_0", "/blocks.21/self_attn/Unsqueeze_7_output_0", "/blocks.21/self_attn/Slice_1_output_0", "/blocks.21/self_attn/Neg_output_0", "/blocks.21/self_attn/Unsqueeze_6_output_0", "/blocks.21/self_attn/Slice_output_0", "/blocks.21/self_attn/Concat_3_output_0", "Unsqueeze9013", "Unsqueeze9016", "StridedSlice9019", "Squeeze9020", "BinaryOp9021", "BinaryOp9022", "/blocks.21/self_attn/Gather_3_output_0", "/blocks.21/self_attn/Mul_1_output_0", "/blocks.21/self_attn/Add_output_0", "/blocks.21/self_attn/k_proj/FakeLinear_output_0", "/blocks.21/self_attn/Unsqueeze_2_output_0", "/blocks.21/self_attn/Unsqueeze_3_output_0", "/blocks.21/self_attn/Concat_1_output_0", "/blocks.21/self_attn/Reshape_1_output_0", "/blocks.21/self_attn/k_norm/Cast_output_0", "/blocks.21/self_attn/k_norm/Mul_1_output_0", "/blocks.21/self_attn/Mul_2_output_0", "/blocks.21/self_attn/Shape_3_output_0", "Shape8984", "Rank8986", "BinaryOp8988", "Unsqueeze8989", "BinaryOp8991", "Unsqueeze8992", "StridedSlice8995", "Squeeze8996", "BinaryOp8997", "BinaryOp8998", "/blocks.21/self_attn/Gather_5_output_0", "/blocks.21/self_attn/Div_1_output_0", "/blocks.21/self_attn/Unsqueeze_9_output_0", "/blocks.21/self_attn/Slice_3_output_0", "/blocks.21/self_attn/Neg_1_output_0", "/blocks.21/self_attn/Unsqueeze_8_output_0", "/blocks.21/self_attn/Slice_2_output_0", "/blocks.21/self_attn/Concat_4_output_0", "/blocks.21/self_attn/Mul_3_output_0", "/blocks.21/self_attn/Add_1_output_0", "/blocks.21/self_attn/v_proj/FakeLinear_output_0", "/blocks.21/self_attn/Unsqueeze_4_output_0", "/blocks.21/self_attn/Unsqueeze_5_output_0", "/blocks.21/self_attn/Concat_2_output_0", "/blocks.21/self_attn/Reshape_2_output_0", "/blocks.21/self_attn/Reshape_7_output_0", "/blocks.21/self_attn/o_proj/FakeLinear_output_0", "/blocks.21/Add_output_0", "/blocks.21/post_attention_layernorm/Mul_1_output_0", "/blocks.21/mlp/gate_proj/FakeLinear_output_0", "/blocks.21/mlp/act_fn/Mul_output_0", "/blocks.21/mlp/up_proj/FakeLinear_output_0", "/blocks.21/mlp/Mul_output_0", "/blocks.21/mlp/down_proj/FakeLinear_output_0", "/blocks.21/Add_1_output_0", "/blocks.22/Reshape_output_0", "/blocks.22/input_layernorm/Mul_1_output_0", "/blocks.22/self_attn/q_proj/FakeLinear_output_0", "/blocks.22/self_attn/Shape_output_0", "Shape9343", "Rank9345", "BinaryOp9347", "Unsqueeze9348", "BinaryOp9350", "Unsqueeze9351", "StridedSlice9354", "Squeeze9355", "BinaryOp9357", "/blocks.22/self_attn/Gather_output_0", "/blocks.22/self_attn/Unsqueeze_output_0", "Unsqueeze9365", "Unsqueeze9368", "StridedSlice9371", "Squeeze9372", "BinaryOp9373", "BinaryOp9374", "/blocks.22/self_attn/Gather_1_output_0", "/blocks.22/self_attn/Unsqueeze_1_output_0", "/blocks.22/self_attn/Concat_output_0", "/blocks.22/self_attn/Reshape_output_0", "/blocks.22/self_attn/q_norm/Cast_output_0", "/blocks.22/self_attn/q_norm/Mul_1_output_0", "Unsqueeze9392", "Unsqueeze9395", "StridedSlice9398", "Squeeze9399", "BinaryOp9401", "/blocks.22/self_attn/Gather_2_output_0", "/blocks.22/self_attn/Mul_output_0", "/blocks.22/self_attn/Shape_2_output_0", "Shape9525", "Rank9527", "BinaryOp9529", "Unsqueeze9530", "BinaryOp9532", "Unsqueeze9533", "StridedSlice9536", "Squeeze9537", "BinaryOp9538", "BinaryOp9539", "/blocks.22/self_attn/Gather_4_output_0", "/blocks.22/self_attn/Div_output_0", "/blocks.22/self_attn/Unsqueeze_7_output_0", "/blocks.22/self_attn/Slice_1_output_0", "/blocks.22/self_attn/Neg_output_0", "/blocks.22/self_attn/Unsqueeze_6_output_0", "/blocks.22/self_attn/Slice_output_0", "/blocks.22/self_attn/Concat_3_output_0", "Unsqueeze9434", "Unsqueeze9437", "StridedSlice9440", "Squeeze9441", "BinaryOp9442", "BinaryOp9443", "/blocks.22/self_attn/Gather_3_output_0", "/blocks.22/self_attn/Mul_1_output_0", "/blocks.22/self_attn/Add_output_0", "/blocks.22/self_attn/k_proj/FakeLinear_output_0", "/blocks.22/self_attn/Unsqueeze_2_output_0", "/blocks.22/self_attn/Unsqueeze_3_output_0", "/blocks.22/self_attn/Concat_1_output_0", "/blocks.22/self_attn/Reshape_1_output_0", "/blocks.22/self_attn/k_norm/Cast_output_0", "/blocks.22/self_attn/k_norm/Mul_1_output_0", "/blocks.22/self_attn/Mul_2_output_0", "/blocks.22/self_attn/Shape_3_output_0", "Shape9405", "Rank9407", "BinaryOp9409", "Unsqueeze9410", "BinaryOp9412", "Unsqueeze9413", "StridedSlice9416", "Squeeze9417", "BinaryOp9418", "BinaryOp9419", "/blocks.22/self_attn/Gather_5_output_0", "/blocks.22/self_attn/Div_1_output_0", "/blocks.22/self_attn/Unsqueeze_9_output_0", "/blocks.22/self_attn/Slice_3_output_0", "/blocks.22/self_attn/Neg_1_output_0", "/blocks.22/self_attn/Unsqueeze_8_output_0", "/blocks.22/self_attn/Slice_2_output_0", "/blocks.22/self_attn/Concat_4_output_0", "/blocks.22/self_attn/Mul_3_output_0", "/blocks.22/self_attn/Add_1_output_0", "/blocks.22/self_attn/v_proj/FakeLinear_output_0", "/blocks.22/self_attn/Unsqueeze_4_output_0", "/blocks.22/self_attn/Unsqueeze_5_output_0", "/blocks.22/self_attn/Concat_2_output_0", "/blocks.22/self_attn/Reshape_2_output_0", "/blocks.22/self_attn/Reshape_7_output_0", "/blocks.22/self_attn/o_proj/FakeLinear_output_0", "/blocks.22/Add_output_0", "/blocks.22/post_attention_layernorm/Mul_1_output_0", "/blocks.22/mlp/gate_proj/FakeLinear_output_0", "/blocks.22/mlp/act_fn/Mul_output_0", "/blocks.22/mlp/up_proj/FakeLinear_output_0", "/blocks.22/mlp/Mul_output_0", "/blocks.22/mlp/down_proj/FakeLinear_output_0", "/blocks.22/Add_1_output_0", "/blocks.23/Reshape_output_0", "/blocks.23/input_layernorm/Mul_1_output_0", "/blocks.23/self_attn/q_proj/FakeLinear_output_0", "/blocks.23/self_attn/Shape_output_0", "Shape9764", "Rank9766", "BinaryOp9768", "Unsqueeze9769", "BinaryOp9771", "Unsqueeze9772", "StridedSlice9775", "Squeeze9776", "BinaryOp9778", "/blocks.23/self_attn/Gather_output_0", "/blocks.23/self_attn/Unsqueeze_output_0", "Unsqueeze9786", "Unsqueeze9789", "StridedSlice9792", "Squeeze9793", "BinaryOp9794", "BinaryOp9795", "/blocks.23/self_attn/Gather_1_output_0", "/blocks.23/self_attn/Unsqueeze_1_output_0", "/blocks.23/self_attn/Concat_output_0", "/blocks.23/self_attn/Reshape_output_0", "/blocks.23/self_attn/q_norm/Cast_output_0", "/blocks.23/self_attn/q_norm/Mul_1_output_0", "Unsqueeze9813", "Unsqueeze9816", "StridedSlice9819", "Squeeze9820", "BinaryOp9822", "/blocks.23/self_attn/Gather_2_output_0", "/blocks.23/self_attn/Mul_output_0", "/blocks.23/self_attn/Shape_2_output_0", "Shape9946", "Rank9948", "BinaryOp9950", "Unsqueeze9951", "BinaryOp9953", "Unsqueeze9954", "StridedSlice9957", "Squeeze9958", "BinaryOp9959", "BinaryOp9960", "/blocks.23/self_attn/Gather_4_output_0", "/blocks.23/self_attn/Div_output_0", "/blocks.23/self_attn/Unsqueeze_7_output_0", "/blocks.23/self_attn/Slice_1_output_0", "/blocks.23/self_attn/Neg_output_0", "/blocks.23/self_attn/Unsqueeze_6_output_0", "/blocks.23/self_attn/Slice_output_0", "/blocks.23/self_attn/Concat_3_output_0", "Unsqueeze9855", "Unsqueeze9858", "StridedSlice9861", "Squeeze9862", "BinaryOp9863", "BinaryOp9864", "/blocks.23/self_attn/Gather_3_output_0", "/blocks.23/self_attn/Mul_1_output_0", "/blocks.23/self_attn/Add_output_0", "/blocks.23/self_attn/k_proj/FakeLinear_output_0", "/blocks.23/self_attn/Unsqueeze_2_output_0", "/blocks.23/self_attn/Unsqueeze_3_output_0", "/blocks.23/self_attn/Concat_1_output_0", "/blocks.23/self_attn/Reshape_1_output_0", "/blocks.23/self_attn/k_norm/Cast_output_0", "/blocks.23/self_attn/k_norm/Mul_1_output_0", "/blocks.23/self_attn/Mul_2_output_0", "/blocks.23/self_attn/Shape_3_output_0", "Shape9826", "Rank9828", "BinaryOp9830", "Unsqueeze9831", "BinaryOp9833", "Unsqueeze9834", "StridedSlice9837", "Squeeze9838", "BinaryOp9839", "BinaryOp9840", "/blocks.23/self_attn/Gather_5_output_0", "/blocks.23/self_attn/Div_1_output_0", "/blocks.23/self_attn/Unsqueeze_9_output_0", "/blocks.23/self_attn/Slice_3_output_0", "/blocks.23/self_attn/Neg_1_output_0", "/blocks.23/self_attn/Unsqueeze_8_output_0", "/blocks.23/self_attn/Slice_2_output_0", "/blocks.23/self_attn/Concat_4_output_0", "/blocks.23/self_attn/Mul_3_output_0", "/blocks.23/self_attn/Add_1_output_0", "/blocks.23/self_attn/v_proj/FakeLinear_output_0", "/blocks.23/self_attn/Unsqueeze_4_output_0", "/blocks.23/self_attn/Unsqueeze_5_output_0", "/blocks.23/self_attn/Concat_2_output_0", "/blocks.23/self_attn/Reshape_2_output_0", "/blocks.23/self_attn/Reshape_7_output_0", "/blocks.23/self_attn/o_proj/FakeLinear_output_0", "/blocks.23/Add_output_0", "/blocks.23/post_attention_layernorm/Mul_1_output_0", "/blocks.23/mlp/gate_proj/FakeLinear_output_0", "/blocks.23/mlp/act_fn/Mul_output_0", "/blocks.23/mlp/up_proj/FakeLinear_output_0", "/blocks.23/mlp/Mul_output_0", "/blocks.23/mlp/down_proj/FakeLinear_output_0", "/blocks.23/Add_1_output_0", "/blocks.24/Reshape_output_0", "/blocks.24/input_layernorm/Mul_1_output_0", "/blocks.24/self_attn/q_proj/FakeLinear_output_0", "/blocks.24/self_attn/Shape_output_0", "Shape10185", "Rank10187", "BinaryOp10189", "Unsqueeze10190", "BinaryOp10192", "Unsqueeze10193", "StridedSlice10196", "Squeeze10197", "BinaryOp10199", "/blocks.24/self_attn/Gather_output_0", "/blocks.24/self_attn/Unsqueeze_output_0", "Unsqueeze10207", "Unsqueeze10210", "StridedSlice10213", "Squeeze10214", "BinaryOp10215", "BinaryOp10216", "/blocks.24/self_attn/Gather_1_output_0", "/blocks.24/self_attn/Unsqueeze_1_output_0", "/blocks.24/self_attn/Concat_output_0", "/blocks.24/self_attn/Reshape_output_0", "/blocks.24/self_attn/q_norm/Cast_output_0", "/blocks.24/self_attn/q_norm/Mul_1_output_0", "Unsqueeze10234", "Unsqueeze10237", "StridedSlice10240", "Squeeze10241", "BinaryOp10243", "/blocks.24/self_attn/Gather_2_output_0", "/blocks.24/self_attn/Mul_output_0", "/blocks.24/self_attn/Shape_2_output_0", "Shape10367", "Rank10369", "BinaryOp10371", "Unsqueeze10372", "BinaryOp10374", "Unsqueeze10375", "StridedSlice10378", "Squeeze10379", "BinaryOp10380", "BinaryOp10381", "/blocks.24/self_attn/Gather_4_output_0", "/blocks.24/self_attn/Div_output_0", "/blocks.24/self_attn/Unsqueeze_7_output_0", "/blocks.24/self_attn/Slice_1_output_0", "/blocks.24/self_attn/Neg_output_0", "/blocks.24/self_attn/Unsqueeze_6_output_0", "/blocks.24/self_attn/Slice_output_0", "/blocks.24/self_attn/Concat_3_output_0", "Unsqueeze10276", "Unsqueeze10279", "StridedSlice10282", "Squeeze10283", "BinaryOp10284", "BinaryOp10285", "/blocks.24/self_attn/Gather_3_output_0", "/blocks.24/self_attn/Mul_1_output_0", "/blocks.24/self_attn/Add_output_0", "/blocks.24/self_attn/k_proj/FakeLinear_output_0", "/blocks.24/self_attn/Unsqueeze_2_output_0", "/blocks.24/self_attn/Unsqueeze_3_output_0", "/blocks.24/self_attn/Concat_1_output_0", "/blocks.24/self_attn/Reshape_1_output_0", "/blocks.24/self_attn/k_norm/Cast_output_0", "/blocks.24/self_attn/k_norm/Mul_1_output_0", "/blocks.24/self_attn/Mul_2_output_0", "/blocks.24/self_attn/Shape_3_output_0", "Shape10247", "Rank10249", "BinaryOp10251", "Unsqueeze10252", "BinaryOp10254", "Unsqueeze10255", "StridedSlice10258", "Squeeze10259", "BinaryOp10260", "BinaryOp10261", "/blocks.24/self_attn/Gather_5_output_0", "/blocks.24/self_attn/Div_1_output_0", "/blocks.24/self_attn/Unsqueeze_9_output_0", "/blocks.24/self_attn/Slice_3_output_0", "/blocks.24/self_attn/Neg_1_output_0", "/blocks.24/self_attn/Unsqueeze_8_output_0", "/blocks.24/self_attn/Slice_2_output_0", "/blocks.24/self_attn/Concat_4_output_0", "/blocks.24/self_attn/Mul_3_output_0", "/blocks.24/self_attn/Add_1_output_0", "/blocks.24/self_attn/v_proj/FakeLinear_output_0", "/blocks.24/self_attn/Unsqueeze_4_output_0", "/blocks.24/self_attn/Unsqueeze_5_output_0", "/blocks.24/self_attn/Concat_2_output_0", "/blocks.24/self_attn/Reshape_2_output_0", "/blocks.24/self_attn/Reshape_7_output_0", "/blocks.24/self_attn/o_proj/FakeLinear_output_0", "/blocks.24/Add_output_0", "/blocks.24/post_attention_layernorm/Mul_1_output_0", "/blocks.24/mlp/gate_proj/FakeLinear_output_0", "/blocks.24/mlp/act_fn/Mul_output_0", "/blocks.24/mlp/up_proj/FakeLinear_output_0", "/blocks.24/mlp/Mul_output_0", "/blocks.24/mlp/down_proj/FakeLinear_output_0", "/blocks.24/Add_1_output_0", "/blocks.25/Reshape_output_0", "/blocks.25/input_layernorm/Mul_1_output_0", "/blocks.25/self_attn/q_proj/FakeLinear_output_0", "/blocks.25/self_attn/Shape_output_0", "Shape10606", "Rank10608", "BinaryOp10610", "Unsqueeze10611", "BinaryOp10613", "Unsqueeze10614", "StridedSlice10617", "Squeeze10618", "BinaryOp10620", "/blocks.25/self_attn/Gather_output_0", "/blocks.25/self_attn/Unsqueeze_output_0", "Unsqueeze10628", "Unsqueeze10631", "StridedSlice10634", "Squeeze10635", "BinaryOp10636", "BinaryOp10637", "/blocks.25/self_attn/Gather_1_output_0", "/blocks.25/self_attn/Unsqueeze_1_output_0", "/blocks.25/self_attn/Concat_output_0", "/blocks.25/self_attn/Reshape_output_0", "/blocks.25/self_attn/q_norm/Cast_output_0", "/blocks.25/self_attn/q_norm/Mul_1_output_0", "Unsqueeze10655", "Unsqueeze10658", "StridedSlice10661", "Squeeze10662", "BinaryOp10664", "/blocks.25/self_attn/Gather_2_output_0", "/blocks.25/self_attn/Mul_output_0", "/blocks.25/self_attn/Shape_2_output_0", "Shape10788", "Rank10790", "BinaryOp10792", "Unsqueeze10793", "BinaryOp10795", "Unsqueeze10796", "StridedSlice10799", "Squeeze10800", "BinaryOp10801", "BinaryOp10802", "/blocks.25/self_attn/Gather_4_output_0", "/blocks.25/self_attn/Div_output_0", "/blocks.25/self_attn/Unsqueeze_7_output_0", "/blocks.25/self_attn/Slice_1_output_0", "/blocks.25/self_attn/Neg_output_0", "/blocks.25/self_attn/Unsqueeze_6_output_0", "/blocks.25/self_attn/Slice_output_0", "/blocks.25/self_attn/Concat_3_output_0", "Unsqueeze10697", "Unsqueeze10700", "StridedSlice10703", "Squeeze10704", "BinaryOp10705", "BinaryOp10706", "/blocks.25/self_attn/Gather_3_output_0", "/blocks.25/self_attn/Mul_1_output_0", "/blocks.25/self_attn/Add_output_0", "/blocks.25/self_attn/k_proj/FakeLinear_output_0", "/blocks.25/self_attn/Unsqueeze_2_output_0", "/blocks.25/self_attn/Unsqueeze_3_output_0", "/blocks.25/self_attn/Concat_1_output_0", "/blocks.25/self_attn/Reshape_1_output_0", "/blocks.25/self_attn/k_norm/Cast_output_0", "/blocks.25/self_attn/k_norm/Mul_1_output_0", "/blocks.25/self_attn/Mul_2_output_0", "/blocks.25/self_attn/Shape_3_output_0", "Shape10668", "Rank10670", "BinaryOp10672", "Unsqueeze10673", "BinaryOp10675", "Unsqueeze10676", "StridedSlice10679", "Squeeze10680", "BinaryOp10681", "BinaryOp10682", "/blocks.25/self_attn/Gather_5_output_0", "/blocks.25/self_attn/Div_1_output_0", "/blocks.25/self_attn/Unsqueeze_9_output_0", "/blocks.25/self_attn/Slice_3_output_0", "/blocks.25/self_attn/Neg_1_output_0", "/blocks.25/self_attn/Unsqueeze_8_output_0", "/blocks.25/self_attn/Slice_2_output_0", "/blocks.25/self_attn/Concat_4_output_0", "/blocks.25/self_attn/Mul_3_output_0", "/blocks.25/self_attn/Add_1_output_0", "/blocks.25/self_attn/v_proj/FakeLinear_output_0", "/blocks.25/self_attn/Unsqueeze_4_output_0", "/blocks.25/self_attn/Unsqueeze_5_output_0", "/blocks.25/self_attn/Concat_2_output_0", "/blocks.25/self_attn/Reshape_2_output_0", "/blocks.25/self_attn/Reshape_7_output_0", "/blocks.25/self_attn/o_proj/FakeLinear_output_0", "/blocks.25/Add_output_0", "/blocks.25/post_attention_layernorm/Mul_1_output_0", "/blocks.25/mlp/gate_proj/FakeLinear_output_0", "/blocks.25/mlp/act_fn/Mul_output_0", "/blocks.25/mlp/up_proj/FakeLinear_output_0", "/blocks.25/mlp/Mul_output_0", "/blocks.25/mlp/down_proj/FakeLinear_output_0", "/blocks.25/Add_1_output_0", "/blocks.26/Reshape_output_0", "/blocks.26/input_layernorm/Mul_1_output_0", "/blocks.26/self_attn/q_proj/FakeLinear_output_0", "/blocks.26/self_attn/Shape_output_0", "Shape11027", "Rank11029", "BinaryOp11031", "Unsqueeze11032", "BinaryOp11034", "Unsqueeze11035", "StridedSlice11038", "Squeeze11039", "BinaryOp11041", "/blocks.26/self_attn/Gather_output_0", "/blocks.26/self_attn/Unsqueeze_output_0", "Unsqueeze11049", "Unsqueeze11052", "StridedSlice11055", "Squeeze11056", "BinaryOp11057", "BinaryOp11058", "/blocks.26/self_attn/Gather_1_output_0", "/blocks.26/self_attn/Unsqueeze_1_output_0", "/blocks.26/self_attn/Concat_output_0", "/blocks.26/self_attn/Reshape_output_0", "/blocks.26/self_attn/q_norm/Cast_output_0", "/blocks.26/self_attn/q_norm/Mul_1_output_0", "Unsqueeze11076", "Unsqueeze11079", "StridedSlice11082", "Squeeze11083", "BinaryOp11085", "/blocks.26/self_attn/Gather_2_output_0", "/blocks.26/self_attn/Mul_output_0", "/blocks.26/self_attn/Shape_2_output_0", "Shape11209", "Rank11211", "BinaryOp11213", "Unsqueeze11214", "BinaryOp11216", "Unsqueeze11217", "StridedSlice11220", "Squeeze11221", "BinaryOp11222", "BinaryOp11223", "/blocks.26/self_attn/Gather_4_output_0", "/blocks.26/self_attn/Div_output_0", "/blocks.26/self_attn/Unsqueeze_7_output_0", "/blocks.26/self_attn/Slice_1_output_0", "/blocks.26/self_attn/Neg_output_0", "/blocks.26/self_attn/Unsqueeze_6_output_0", "/blocks.26/self_attn/Slice_output_0", "/blocks.26/self_attn/Concat_3_output_0", "Unsqueeze11118", "Unsqueeze11121", "StridedSlice11124", "Squeeze11125", "BinaryOp11126", "BinaryOp11127", "/blocks.26/self_attn/Gather_3_output_0", "/blocks.26/self_attn/Mul_1_output_0", "/blocks.26/self_attn/Add_output_0", "/blocks.26/self_attn/k_proj/FakeLinear_output_0", "/blocks.26/self_attn/Unsqueeze_2_output_0", "/blocks.26/self_attn/Unsqueeze_3_output_0", "/blocks.26/self_attn/Concat_1_output_0", "/blocks.26/self_attn/Reshape_1_output_0", "/blocks.26/self_attn/k_norm/Cast_output_0", "/blocks.26/self_attn/k_norm/Mul_1_output_0", "/blocks.26/self_attn/Mul_2_output_0", "/blocks.26/self_attn/Shape_3_output_0", "Shape11089", "Rank11091", "BinaryOp11093", "Unsqueeze11094", "BinaryOp11096", "Unsqueeze11097", "StridedSlice11100", "Squeeze11101", "BinaryOp11102", "BinaryOp11103", "/blocks.26/self_attn/Gather_5_output_0", "/blocks.26/self_attn/Div_1_output_0", "/blocks.26/self_attn/Unsqueeze_9_output_0", "/blocks.26/self_attn/Slice_3_output_0", "/blocks.26/self_attn/Neg_1_output_0", "/blocks.26/self_attn/Unsqueeze_8_output_0", "/blocks.26/self_attn/Slice_2_output_0", "/blocks.26/self_attn/Concat_4_output_0", "/blocks.26/self_attn/Mul_3_output_0", "/blocks.26/self_attn/Add_1_output_0", "/blocks.26/self_attn/v_proj/FakeLinear_output_0", "/blocks.26/self_attn/Unsqueeze_4_output_0", "/blocks.26/self_attn/Unsqueeze_5_output_0", "/blocks.26/self_attn/Concat_2_output_0", "/blocks.26/self_attn/Reshape_2_output_0", "/blocks.26/self_attn/Reshape_7_output_0", "/blocks.26/self_attn/o_proj/FakeLinear_output_0", "/blocks.26/Add_output_0", "/blocks.26/post_attention_layernorm/Mul_1_output_0", "/blocks.26/mlp/gate_proj/FakeLinear_output_0", "/blocks.26/mlp/act_fn/Mul_output_0", "/blocks.26/mlp/up_proj/FakeLinear_output_0", "/blocks.26/mlp/Mul_output_0", "/blocks.26/mlp/down_proj/FakeLinear_output_0", "/blocks.26/Add_1_output_0", "/blocks.27/Reshape_output_0", "/blocks.27/input_layernorm/Mul_1_output_0", "/blocks.27/self_attn/q_proj/FakeLinear_output_0", "/blocks.27/self_attn/Shape_output_0", "Shape11448", "Rank11450", "BinaryOp11452", "Unsqueeze11453", "BinaryOp11455", "Unsqueeze11456", "StridedSlice11459", "Squeeze11460", "BinaryOp11462", "/blocks.27/self_attn/Gather_output_0", "/blocks.27/self_attn/Unsqueeze_output_0", "Unsqueeze11470", "Unsqueeze11473", "StridedSlice11476", "Squeeze11477", "BinaryOp11478", "BinaryOp11479", "/blocks.27/self_attn/Gather_1_output_0", "/blocks.27/self_attn/Unsqueeze_1_output_0", "/blocks.27/self_attn/Concat_output_0", "/blocks.27/self_attn/Reshape_output_0", "/blocks.27/self_attn/q_norm/Cast_output_0", "/blocks.27/self_attn/q_norm/Mul_1_output_0", "Unsqueeze11497", "Unsqueeze11500", "StridedSlice11503", "Squeeze11504", "BinaryOp11506", "/blocks.27/self_attn/Gather_2_output_0", "/blocks.27/self_attn/Mul_output_0", "/blocks.27/self_attn/Shape_2_output_0", "Shape11630", "Rank11632", "BinaryOp11634", "Unsqueeze11635", "BinaryOp11637", "Unsqueeze11638", "StridedSlice11641", "Squeeze11642", "BinaryOp11643", "BinaryOp11644", "/blocks.27/self_attn/Gather_4_output_0", "/blocks.27/self_attn/Div_output_0", "/blocks.27/self_attn/Unsqueeze_7_output_0", "/blocks.27/self_attn/Slice_1_output_0", "/blocks.27/self_attn/Neg_output_0", "/blocks.27/self_attn/Unsqueeze_6_output_0", "/blocks.27/self_attn/Slice_output_0", "/blocks.27/self_attn/Concat_3_output_0", "Unsqueeze11539", "Unsqueeze11542", "StridedSlice11545", "Squeeze11546", "BinaryOp11547", "BinaryOp11548", "/blocks.27/self_attn/Gather_3_output_0", "/blocks.27/self_attn/Mul_1_output_0", "/blocks.27/self_attn/Add_output_0", "/blocks.27/self_attn/k_proj/FakeLinear_output_0", "/blocks.27/self_attn/Unsqueeze_2_output_0", "/blocks.27/self_attn/Unsqueeze_3_output_0", "/blocks.27/self_attn/Concat_1_output_0", "/blocks.27/self_attn/Reshape_1_output_0", "/blocks.27/self_attn/k_norm/Cast_output_0", "/blocks.27/self_attn/k_norm/Mul_1_output_0", "/blocks.27/self_attn/Mul_2_output_0", "/blocks.27/self_attn/Shape_3_output_0", "Shape11510", "Rank11512", "BinaryOp11514", "Unsqueeze11515", "BinaryOp11517", "Unsqueeze11518", "StridedSlice11521", "Squeeze11522", "BinaryOp11523", "BinaryOp11524", "/blocks.27/self_attn/Gather_5_output_0", "/blocks.27/self_attn/Div_1_output_0", "/blocks.27/self_attn/Unsqueeze_9_output_0", "/blocks.27/self_attn/Slice_3_output_0", "/blocks.27/self_attn/Neg_1_output_0", "/blocks.27/self_attn/Unsqueeze_8_output_0", "/blocks.27/self_attn/Slice_2_output_0", "/blocks.27/self_attn/Concat_4_output_0", "/blocks.27/self_attn/Mul_3_output_0", "/blocks.27/self_attn/Add_1_output_0", "/blocks.27/self_attn/v_proj/FakeLinear_output_0", "/blocks.27/self_attn/Unsqueeze_4_output_0", "/blocks.27/self_attn/Unsqueeze_5_output_0", "/blocks.27/self_attn/Concat_2_output_0", "/blocks.27/self_attn/Reshape_2_output_0", "/blocks.27/self_attn/Reshape_7_output_0", "/blocks.27/self_attn/o_proj/FakeLinear_output_0", "/blocks.27/Add_output_0", "/blocks.27/post_attention_layernorm/Mul_1_output_0", "/blocks.27/mlp/gate_proj/FakeLinear_output_0", "/blocks.27/mlp/act_fn/Mul_output_0", "/blocks.27/mlp/up_proj/FakeLinear_output_0", "/blocks.27/mlp/Mul_output_0", "/blocks.27/mlp/down_proj/FakeLinear_output_0", "/blocks.27/Add_1_output_0", "/blocks.28/Reshape_output_0", "/blocks.28/input_layernorm/Mul_1_output_0", "/blocks.28/self_attn/q_proj/FakeLinear_output_0", "/blocks.28/self_attn/Shape_output_0", "Shape11869", "Rank11871", "BinaryOp11873", "Unsqueeze11874", "BinaryOp11876", "Unsqueeze11877", "StridedSlice11880", "Squeeze11881", "BinaryOp11883", "/blocks.28/self_attn/Gather_output_0", "/blocks.28/self_attn/Unsqueeze_output_0", "Unsqueeze11891", "Unsqueeze11894", "StridedSlice11897", "Squeeze11898", "BinaryOp11899", "BinaryOp11900", "/blocks.28/self_attn/Gather_1_output_0", "/blocks.28/self_attn/Unsqueeze_1_output_0", "/blocks.28/self_attn/Concat_output_0", "/blocks.28/self_attn/Reshape_output_0", "/blocks.28/self_attn/q_norm/Cast_output_0", "/blocks.28/self_attn/q_norm/Mul_1_output_0", "Unsqueeze11918", "Unsqueeze11921", "StridedSlice11924", "Squeeze11925", "BinaryOp11927", "/blocks.28/self_attn/Gather_2_output_0", "/blocks.28/self_attn/Mul_output_0", "/blocks.28/self_attn/Shape_2_output_0", "Shape12051", "Rank12053", "BinaryOp12055", "Unsqueeze12056", "BinaryOp12058", "Unsqueeze12059", "StridedSlice12062", "Squeeze12063", "BinaryOp12064", "BinaryOp12065", "/blocks.28/self_attn/Gather_4_output_0", "/blocks.28/self_attn/Div_output_0", "/blocks.28/self_attn/Unsqueeze_7_output_0", "/blocks.28/self_attn/Slice_1_output_0", "/blocks.28/self_attn/Neg_output_0", "/blocks.28/self_attn/Unsqueeze_6_output_0", "/blocks.28/self_attn/Slice_output_0", "/blocks.28/self_attn/Concat_3_output_0", "Unsqueeze11960", "Unsqueeze11963", "StridedSlice11966", "Squeeze11967", "BinaryOp11968", "BinaryOp11969", "/blocks.28/self_attn/Gather_3_output_0", "/blocks.28/self_attn/Mul_1_output_0", "/blocks.28/self_attn/Add_output_0", "/blocks.28/self_attn/k_proj/FakeLinear_output_0", "/blocks.28/self_attn/Unsqueeze_2_output_0", "/blocks.28/self_attn/Unsqueeze_3_output_0", "/blocks.28/self_attn/Concat_1_output_0", "/blocks.28/self_attn/Reshape_1_output_0", "/blocks.28/self_attn/k_norm/Cast_output_0", "/blocks.28/self_attn/k_norm/Mul_1_output_0", "/blocks.28/self_attn/Mul_2_output_0", "/blocks.28/self_attn/Shape_3_output_0", "Shape11931", "Rank11933", "BinaryOp11935", "Unsqueeze11936", "BinaryOp11938", "Unsqueeze11939", "StridedSlice11942", "Squeeze11943", "BinaryOp11944", "BinaryOp11945", "/blocks.28/self_attn/Gather_5_output_0", "/blocks.28/self_attn/Div_1_output_0", "/blocks.28/self_attn/Unsqueeze_9_output_0", "/blocks.28/self_attn/Slice_3_output_0", "/blocks.28/self_attn/Neg_1_output_0", "/blocks.28/self_attn/Unsqueeze_8_output_0", "/blocks.28/self_attn/Slice_2_output_0", "/blocks.28/self_attn/Concat_4_output_0", "/blocks.28/self_attn/Mul_3_output_0", "/blocks.28/self_attn/Add_1_output_0", "/blocks.28/self_attn/v_proj/FakeLinear_output_0", "/blocks.28/self_attn/Unsqueeze_4_output_0", "/blocks.28/self_attn/Unsqueeze_5_output_0", "/blocks.28/self_attn/Concat_2_output_0", "/blocks.28/self_attn/Reshape_2_output_0", "/blocks.28/self_attn/Reshape_7_output_0", "/blocks.28/self_attn/o_proj/FakeLinear_output_0", "/blocks.28/Add_output_0", "/blocks.28/post_attention_layernorm/Mul_1_output_0", "/blocks.28/mlp/gate_proj/FakeLinear_output_0", "/blocks.28/mlp/act_fn/Mul_output_0", "/blocks.28/mlp/up_proj/FakeLinear_output_0", "/blocks.28/mlp/Mul_output_0", "/blocks.28/mlp/down_proj/FakeLinear_output_0", "/blocks.28/Add_1_output_0", "/blocks.29/Reshape_output_0", "/blocks.29/input_layernorm/Mul_1_output_0", "/blocks.29/self_attn/q_proj/FakeLinear_output_0", "/blocks.29/self_attn/Shape_output_0", "Shape12290", "Rank12292", "BinaryOp12294", "Unsqueeze12295", "BinaryOp12297", "Unsqueeze12298", "StridedSlice12301", "Squeeze12302", "BinaryOp12304", "/blocks.29/self_attn/Gather_output_0", "/blocks.29/self_attn/Unsqueeze_output_0", "Unsqueeze12312", "Unsqueeze12315", "StridedSlice12318", "Squeeze12319", "BinaryOp12320", "BinaryOp12321", "/blocks.29/self_attn/Gather_1_output_0", "/blocks.29/self_attn/Unsqueeze_1_output_0", "/blocks.29/self_attn/Concat_output_0", "/blocks.29/self_attn/Reshape_output_0", "/blocks.29/self_attn/q_norm/Cast_output_0", "/blocks.29/self_attn/q_norm/Mul_1_output_0", "Unsqueeze12339", "Unsqueeze12342", "StridedSlice12345", "Squeeze12346", "BinaryOp12348", "/blocks.29/self_attn/Gather_2_output_0", "/blocks.29/self_attn/Mul_output_0", "/blocks.29/self_attn/Shape_2_output_0", "Shape12472", "Rank12474", "BinaryOp12476", "Unsqueeze12477", "BinaryOp12479", "Unsqueeze12480", "StridedSlice12483", "Squeeze12484", "BinaryOp12485", "BinaryOp12486", "/blocks.29/self_attn/Gather_4_output_0", "/blocks.29/self_attn/Div_output_0", "/blocks.29/self_attn/Unsqueeze_7_output_0", "/blocks.29/self_attn/Slice_1_output_0", "/blocks.29/self_attn/Neg_output_0", "/blocks.29/self_attn/Unsqueeze_6_output_0", "/blocks.29/self_attn/Slice_output_0", "/blocks.29/self_attn/Concat_3_output_0", "Unsqueeze12381", "Unsqueeze12384", "StridedSlice12387", "Squeeze12388", "BinaryOp12389", "BinaryOp12390", "/blocks.29/self_attn/Gather_3_output_0", "/blocks.29/self_attn/Mul_1_output_0", "/blocks.29/self_attn/Add_output_0", "/blocks.29/self_attn/k_proj/FakeLinear_output_0", "/blocks.29/self_attn/Unsqueeze_2_output_0", "/blocks.29/self_attn/Unsqueeze_3_output_0", "/blocks.29/self_attn/Concat_1_output_0", "/blocks.29/self_attn/Reshape_1_output_0", "/blocks.29/self_attn/k_norm/Cast_output_0", "/blocks.29/self_attn/k_norm/Mul_1_output_0", "/blocks.29/self_attn/Mul_2_output_0", "/blocks.29/self_attn/Shape_3_output_0", "Shape12352", "Rank12354", "BinaryOp12356", "Unsqueeze12357", "BinaryOp12359", "Unsqueeze12360", "StridedSlice12363", "Squeeze12364", "BinaryOp12365", "BinaryOp12366", "/blocks.29/self_attn/Gather_5_output_0", "/blocks.29/self_attn/Div_1_output_0", "/blocks.29/self_attn/Unsqueeze_9_output_0", "/blocks.29/self_attn/Slice_3_output_0", "/blocks.29/self_attn/Neg_1_output_0", "/blocks.29/self_attn/Unsqueeze_8_output_0", "/blocks.29/self_attn/Slice_2_output_0", "/blocks.29/self_attn/Concat_4_output_0", "/blocks.29/self_attn/Mul_3_output_0", "/blocks.29/self_attn/Add_1_output_0", "/blocks.29/self_attn/v_proj/FakeLinear_output_0", "/blocks.29/self_attn/Unsqueeze_4_output_0", "/blocks.29/self_attn/Unsqueeze_5_output_0", "/blocks.29/self_attn/Concat_2_output_0", "/blocks.29/self_attn/Reshape_2_output_0", "/blocks.29/self_attn/Reshape_7_output_0", "/blocks.29/self_attn/o_proj/FakeLinear_output_0", "/blocks.29/Add_output_0", "/blocks.29/post_attention_layernorm/Mul_1_output_0", "/blocks.29/mlp/gate_proj/FakeLinear_output_0", "/blocks.29/mlp/act_fn/Mul_output_0", "/blocks.29/mlp/up_proj/FakeLinear_output_0", "/blocks.29/mlp/Mul_output_0", "/blocks.29/mlp/down_proj/FakeLinear_output_0", "/blocks.29/Add_1_output_0", "/blocks.30/Reshape_output_0", "/blocks.30/input_layernorm/Mul_1_output_0", "/blocks.30/self_attn/q_proj/FakeLinear_output_0", "/blocks.30/self_attn/Shape_output_0", "Shape12711", "Rank12713", "BinaryOp12715", "Unsqueeze12716", "BinaryOp12718", "Unsqueeze12719", "StridedSlice12722", "Squeeze12723", "BinaryOp12725", "/blocks.30/self_attn/Gather_output_0", "/blocks.30/self_attn/Unsqueeze_output_0", "Unsqueeze12733", "Unsqueeze12736", "StridedSlice12739", "Squeeze12740", "BinaryOp12741", "BinaryOp12742", "/blocks.30/self_attn/Gather_1_output_0", "/blocks.30/self_attn/Unsqueeze_1_output_0", "/blocks.30/self_attn/Concat_output_0", "/blocks.30/self_attn/Reshape_output_0", "/blocks.30/self_attn/q_norm/Cast_output_0", "/blocks.30/self_attn/q_norm/Mul_1_output_0", "Unsqueeze12760", "Unsqueeze12763", "StridedSlice12766", "Squeeze12767", "BinaryOp12769", "/blocks.30/self_attn/Gather_2_output_0", "/blocks.30/self_attn/Mul_output_0", "/blocks.30/self_attn/Shape_2_output_0", "Shape12893", "Rank12895", "BinaryOp12897", "Unsqueeze12898", "BinaryOp12900", "Unsqueeze12901", "StridedSlice12904", "Squeeze12905", "BinaryOp12906", "BinaryOp12907", "/blocks.30/self_attn/Gather_4_output_0", "/blocks.30/self_attn/Div_output_0", "/blocks.30/self_attn/Unsqueeze_7_output_0", "/blocks.30/self_attn/Slice_1_output_0", "/blocks.30/self_attn/Neg_output_0", "/blocks.30/self_attn/Unsqueeze_6_output_0", "/blocks.30/self_attn/Slice_output_0", "/blocks.30/self_attn/Concat_3_output_0", "Unsqueeze12802", "Unsqueeze12805", "StridedSlice12808", "Squeeze12809", "BinaryOp12810", "BinaryOp12811", "/blocks.30/self_attn/Gather_3_output_0", "/blocks.30/self_attn/Mul_1_output_0", "/blocks.30/self_attn/Add_output_0", "/blocks.30/self_attn/k_proj/FakeLinear_output_0", "/blocks.30/self_attn/Unsqueeze_2_output_0", "/blocks.30/self_attn/Unsqueeze_3_output_0", "/blocks.30/self_attn/Concat_1_output_0", "/blocks.30/self_attn/Reshape_1_output_0", "/blocks.30/self_attn/k_norm/Cast_output_0", "/blocks.30/self_attn/k_norm/Mul_1_output_0", "/blocks.30/self_attn/Mul_2_output_0", "/blocks.30/self_attn/Shape_3_output_0", "Shape12773", "Rank12775", "BinaryOp12777", "Unsqueeze12778", "BinaryOp12780", "Unsqueeze12781", "StridedSlice12784", "Squeeze12785", "BinaryOp12786", "BinaryOp12787", "/blocks.30/self_attn/Gather_5_output_0", "/blocks.30/self_attn/Div_1_output_0", "/blocks.30/self_attn/Unsqueeze_9_output_0", "/blocks.30/self_attn/Slice_3_output_0", "/blocks.30/self_attn/Neg_1_output_0", "/blocks.30/self_attn/Unsqueeze_8_output_0", "/blocks.30/self_attn/Slice_2_output_0", "/blocks.30/self_attn/Concat_4_output_0", "/blocks.30/self_attn/Mul_3_output_0", "/blocks.30/self_attn/Add_1_output_0", "/blocks.30/self_attn/v_proj/FakeLinear_output_0", "/blocks.30/self_attn/Unsqueeze_4_output_0", "/blocks.30/self_attn/Unsqueeze_5_output_0", "/blocks.30/self_attn/Concat_2_output_0", "/blocks.30/self_attn/Reshape_2_output_0", "/blocks.30/self_attn/Reshape_7_output_0", "/blocks.30/self_attn/o_proj/FakeLinear_output_0", "/blocks.30/Add_output_0", "/blocks.30/post_attention_layernorm/Mul_1_output_0", "/blocks.30/mlp/gate_proj/FakeLinear_output_0", "/blocks.30/mlp/act_fn/Mul_output_0", "/blocks.30/mlp/up_proj/FakeLinear_output_0", "/blocks.30/mlp/Mul_output_0", "/blocks.30/mlp/down_proj/FakeLinear_output_0", "/blocks.30/Add_1_output_0", "/blocks.31/Reshape_output_0", "/blocks.31/input_layernorm/Mul_1_output_0", "/blocks.31/self_attn/q_proj/FakeLinear_output_0", "/blocks.31/self_attn/Shape_output_0", "Shape13132", "Rank13134", "BinaryOp13136", "Unsqueeze13137", "BinaryOp13139", "Unsqueeze13140", "StridedSlice13143", "Squeeze13144", "BinaryOp13146", "/blocks.31/self_attn/Gather_output_0", "/blocks.31/self_attn/Unsqueeze_output_0", "Unsqueeze13154", "Unsqueeze13157", "StridedSlice13160", "Squeeze13161", "BinaryOp13162", "BinaryOp13163", "/blocks.31/self_attn/Gather_1_output_0", "/blocks.31/self_attn/Unsqueeze_1_output_0", "/blocks.31/self_attn/Concat_output_0", "/blocks.31/self_attn/Reshape_output_0", "/blocks.31/self_attn/q_norm/Cast_output_0", "/blocks.31/self_attn/q_norm/Mul_1_output_0", "Unsqueeze13181", "Unsqueeze13184", "StridedSlice13187", "Squeeze13188", "BinaryOp13190", "/blocks.31/self_attn/Gather_2_output_0", "/blocks.31/self_attn/Mul_output_0", "/blocks.31/self_attn/Shape_2_output_0", "Shape13314", "Rank13316", "BinaryOp13318", "Unsqueeze13319", "BinaryOp13321", "Unsqueeze13322", "StridedSlice13325", "Squeeze13326", "BinaryOp13327", "BinaryOp13328", "/blocks.31/self_attn/Gather_4_output_0", "/blocks.31/self_attn/Div_output_0", "/blocks.31/self_attn/Unsqueeze_7_output_0", "/blocks.31/self_attn/Slice_1_output_0", "/blocks.31/self_attn/Neg_output_0", "/blocks.31/self_attn/Unsqueeze_6_output_0", "/blocks.31/self_attn/Slice_output_0", "/blocks.31/self_attn/Concat_3_output_0", "Unsqueeze13223", "Unsqueeze13226", "StridedSlice13229", "Squeeze13230", "BinaryOp13231", "BinaryOp13232", "/blocks.31/self_attn/Gather_3_output_0", "/blocks.31/self_attn/Mul_1_output_0", "/blocks.31/self_attn/Add_output_0", "/blocks.31/self_attn/k_proj/FakeLinear_output_0", "/blocks.31/self_attn/Unsqueeze_2_output_0", "/blocks.31/self_attn/Unsqueeze_3_output_0", "/blocks.31/self_attn/Concat_1_output_0", "/blocks.31/self_attn/Reshape_1_output_0", "/blocks.31/self_attn/k_norm/Cast_output_0", "/blocks.31/self_attn/k_norm/Mul_1_output_0", "/blocks.31/self_attn/Mul_2_output_0", "/blocks.31/self_attn/Shape_3_output_0", "Shape13194", "Rank13196", "BinaryOp13198", "Unsqueeze13199", "BinaryOp13201", "Unsqueeze13202", "StridedSlice13205", "Squeeze13206", "BinaryOp13207", "BinaryOp13208", "/blocks.31/self_attn/Gather_5_output_0", "/blocks.31/self_attn/Div_1_output_0", "/blocks.31/self_attn/Unsqueeze_9_output_0", "/blocks.31/self_attn/Slice_3_output_0", "/blocks.31/self_attn/Neg_1_output_0", "/blocks.31/self_attn/Unsqueeze_8_output_0", "/blocks.31/self_attn/Slice_2_output_0", "/blocks.31/self_attn/Concat_4_output_0", "/blocks.31/self_attn/Mul_3_output_0", "/blocks.31/self_attn/Add_1_output_0", "/blocks.31/self_attn/v_proj/FakeLinear_output_0", "/blocks.31/self_attn/Unsqueeze_4_output_0", "/blocks.31/self_attn/Unsqueeze_5_output_0", "/blocks.31/self_attn/Concat_2_output_0", "/blocks.31/self_attn/Reshape_2_output_0", "/blocks.31/self_attn/Reshape_7_output_0", "/blocks.31/self_attn/o_proj/FakeLinear_output_0", "/blocks.31/Add_output_0", "/blocks.31/post_attention_layernorm/Mul_1_output_0", "/blocks.31/mlp/gate_proj/FakeLinear_output_0", "/blocks.31/mlp/act_fn/Mul_output_0", "/blocks.31/mlp/up_proj/FakeLinear_output_0", "/blocks.31/mlp/Mul_output_0", "/blocks.31/mlp/down_proj/FakeLinear_output_0", "/blocks.31/Add_1_output_0", "/blocks.32/Reshape_output_0", "/blocks.32/input_layernorm/Mul_1_output_0", "/blocks.32/self_attn/q_proj/FakeLinear_output_0", "/blocks.32/self_attn/Shape_output_0", "Shape13553", "Rank13555", "BinaryOp13557", "Unsqueeze13558", "BinaryOp13560", "Unsqueeze13561", "StridedSlice13564", "Squeeze13565", "BinaryOp13567", "/blocks.32/self_attn/Gather_output_0", "/blocks.32/self_attn/Unsqueeze_output_0", "Unsqueeze13575", "Unsqueeze13578", "StridedSlice13581", "Squeeze13582", "BinaryOp13583", "BinaryOp13584", "/blocks.32/self_attn/Gather_1_output_0", "/blocks.32/self_attn/Unsqueeze_1_output_0", "/blocks.32/self_attn/Concat_output_0", "/blocks.32/self_attn/Reshape_output_0", "/blocks.32/self_attn/q_norm/Cast_output_0", "/blocks.32/self_attn/q_norm/Mul_1_output_0", "Unsqueeze13602", "Unsqueeze13605", "StridedSlice13608", "Squeeze13609", "BinaryOp13611", "/blocks.32/self_attn/Gather_2_output_0", "/blocks.32/self_attn/Mul_output_0", "/blocks.32/self_attn/Shape_2_output_0", "Shape13735", "Rank13737", "BinaryOp13739", "Unsqueeze13740", "BinaryOp13742", "Unsqueeze13743", "StridedSlice13746", "Squeeze13747", "BinaryOp13748", "BinaryOp13749", "/blocks.32/self_attn/Gather_4_output_0", "/blocks.32/self_attn/Div_output_0", "/blocks.32/self_attn/Unsqueeze_7_output_0", "/blocks.32/self_attn/Slice_1_output_0", "/blocks.32/self_attn/Neg_output_0", "/blocks.32/self_attn/Unsqueeze_6_output_0", "/blocks.32/self_attn/Slice_output_0", "/blocks.32/self_attn/Concat_3_output_0", "Unsqueeze13644", "Unsqueeze13647", "StridedSlice13650", "Squeeze13651", "BinaryOp13652", "BinaryOp13653", "/blocks.32/self_attn/Gather_3_output_0", "/blocks.32/self_attn/Mul_1_output_0", "/blocks.32/self_attn/Add_output_0", "/blocks.32/self_attn/k_proj/FakeLinear_output_0", "/blocks.32/self_attn/Unsqueeze_2_output_0", "/blocks.32/self_attn/Unsqueeze_3_output_0", "/blocks.32/self_attn/Concat_1_output_0", "/blocks.32/self_attn/Reshape_1_output_0", "/blocks.32/self_attn/k_norm/Cast_output_0", "/blocks.32/self_attn/k_norm/Mul_1_output_0", "/blocks.32/self_attn/Mul_2_output_0", "/blocks.32/self_attn/Shape_3_output_0", "Shape13615", "Rank13617", "BinaryOp13619", "Unsqueeze13620", "BinaryOp13622", "Unsqueeze13623", "StridedSlice13626", "Squeeze13627", "BinaryOp13628", "BinaryOp13629", "/blocks.32/self_attn/Gather_5_output_0", "/blocks.32/self_attn/Div_1_output_0", "/blocks.32/self_attn/Unsqueeze_9_output_0", "/blocks.32/self_attn/Slice_3_output_0", "/blocks.32/self_attn/Neg_1_output_0", "/blocks.32/self_attn/Unsqueeze_8_output_0", "/blocks.32/self_attn/Slice_2_output_0", "/blocks.32/self_attn/Concat_4_output_0", "/blocks.32/self_attn/Mul_3_output_0", "/blocks.32/self_attn/Add_1_output_0", "/blocks.32/self_attn/v_proj/FakeLinear_output_0", "/blocks.32/self_attn/Unsqueeze_4_output_0", "/blocks.32/self_attn/Unsqueeze_5_output_0", "/blocks.32/self_attn/Concat_2_output_0", "/blocks.32/self_attn/Reshape_2_output_0", "/blocks.32/self_attn/Reshape_7_output_0", "/blocks.32/self_attn/o_proj/FakeLinear_output_0", "/blocks.32/Add_output_0", "/blocks.32/post_attention_layernorm/Mul_1_output_0", "/blocks.32/mlp/gate_proj/FakeLinear_output_0", "/blocks.32/mlp/act_fn/Mul_output_0", "/blocks.32/mlp/up_proj/FakeLinear_output_0", "/blocks.32/mlp/Mul_output_0", "/blocks.32/mlp/down_proj/FakeLinear_output_0", "/blocks.32/Add_1_output_0", "/blocks.33/Reshape_output_0", "/blocks.33/input_layernorm/Mul_1_output_0", "/blocks.33/self_attn/q_proj/FakeLinear_output_0", "/blocks.33/self_attn/Shape_output_0", "Shape13974", "Rank13976", "BinaryOp13978", "Unsqueeze13979", "BinaryOp13981", "Unsqueeze13982", "StridedSlice13985", "Squeeze13986", "BinaryOp13988", "/blocks.33/self_attn/Gather_output_0", "/blocks.33/self_attn/Unsqueeze_output_0", "Unsqueeze13996", "Unsqueeze13999", "StridedSlice14002", "Squeeze14003", "BinaryOp14004", "BinaryOp14005", "/blocks.33/self_attn/Gather_1_output_0", "/blocks.33/self_attn/Unsqueeze_1_output_0", "/blocks.33/self_attn/Concat_output_0", "/blocks.33/self_attn/Reshape_output_0", "/blocks.33/self_attn/q_norm/Cast_output_0", "/blocks.33/self_attn/q_norm/Mul_1_output_0", "Unsqueeze14023", "Unsqueeze14026", "StridedSlice14029", "Squeeze14030", "BinaryOp14032", "/blocks.33/self_attn/Gather_2_output_0", "/blocks.33/self_attn/Mul_output_0", "/blocks.33/self_attn/Shape_2_output_0", "Shape14156", "Rank14158", "BinaryOp14160", "Unsqueeze14161", "BinaryOp14163", "Unsqueeze14164", "StridedSlice14167", "Squeeze14168", "BinaryOp14169", "BinaryOp14170", "/blocks.33/self_attn/Gather_4_output_0", "/blocks.33/self_attn/Div_output_0", "/blocks.33/self_attn/Unsqueeze_7_output_0", "/blocks.33/self_attn/Slice_1_output_0", "/blocks.33/self_attn/Neg_output_0", "/blocks.33/self_attn/Unsqueeze_6_output_0", "/blocks.33/self_attn/Slice_output_0", "/blocks.33/self_attn/Concat_3_output_0", "Unsqueeze14065", "Unsqueeze14068", "StridedSlice14071", "Squeeze14072", "BinaryOp14073", "BinaryOp14074", "/blocks.33/self_attn/Gather_3_output_0", "/blocks.33/self_attn/Mul_1_output_0", "/blocks.33/self_attn/Add_output_0", "/blocks.33/self_attn/k_proj/FakeLinear_output_0", "/blocks.33/self_attn/Unsqueeze_2_output_0", "/blocks.33/self_attn/Unsqueeze_3_output_0", "/blocks.33/self_attn/Concat_1_output_0", "/blocks.33/self_attn/Reshape_1_output_0", "/blocks.33/self_attn/k_norm/Cast_output_0", "/blocks.33/self_attn/k_norm/Mul_1_output_0", "/blocks.33/self_attn/Mul_2_output_0", "/blocks.33/self_attn/Shape_3_output_0", "Shape14036", "Rank14038", "BinaryOp14040", "Unsqueeze14041", "BinaryOp14043", "Unsqueeze14044", "StridedSlice14047", "Squeeze14048", "BinaryOp14049", "BinaryOp14050", "/blocks.33/self_attn/Gather_5_output_0", "/blocks.33/self_attn/Div_1_output_0", "/blocks.33/self_attn/Unsqueeze_9_output_0", "/blocks.33/self_attn/Slice_3_output_0", "/blocks.33/self_attn/Neg_1_output_0", "/blocks.33/self_attn/Unsqueeze_8_output_0", "/blocks.33/self_attn/Slice_2_output_0", "/blocks.33/self_attn/Concat_4_output_0", "/blocks.33/self_attn/Mul_3_output_0", "/blocks.33/self_attn/Add_1_output_0", "/blocks.33/self_attn/v_proj/FakeLinear_output_0", "/blocks.33/self_attn/Unsqueeze_4_output_0", "/blocks.33/self_attn/Unsqueeze_5_output_0", "/blocks.33/self_attn/Concat_2_output_0", "/blocks.33/self_attn/Reshape_2_output_0", "/blocks.33/self_attn/Reshape_7_output_0", "/blocks.33/self_attn/o_proj/FakeLinear_output_0", "/blocks.33/Add_output_0", "/blocks.33/post_attention_layernorm/Mul_1_output_0", "/blocks.33/mlp/gate_proj/FakeLinear_output_0", "/blocks.33/mlp/act_fn/Mul_output_0", "/blocks.33/mlp/up_proj/FakeLinear_output_0", "/blocks.33/mlp/Mul_output_0", "/blocks.33/mlp/down_proj/FakeLinear_output_0", "/blocks.33/Add_1_output_0", "/blocks.34/Reshape_output_0", "/blocks.34/input_layernorm/Mul_1_output_0", "/blocks.34/self_attn/q_proj/FakeLinear_output_0", "/blocks.34/self_attn/Shape_output_0", "Shape14395", "Rank14397", "BinaryOp14399", "Unsqueeze14400", "BinaryOp14402", "Unsqueeze14403", "StridedSlice14406", "Squeeze14407", "BinaryOp14409", "/blocks.34/self_attn/Gather_output_0", "/blocks.34/self_attn/Unsqueeze_output_0", "Unsqueeze14417", "Unsqueeze14420", "StridedSlice14423", "Squeeze14424", "BinaryOp14425", "BinaryOp14426", "/blocks.34/self_attn/Gather_1_output_0", "/blocks.34/self_attn/Unsqueeze_1_output_0", "/blocks.34/self_attn/Concat_output_0", "/blocks.34/self_attn/Reshape_output_0", "/blocks.34/self_attn/q_norm/Cast_output_0", "/blocks.34/self_attn/q_norm/Mul_1_output_0", "Unsqueeze14444", "Unsqueeze14447", "StridedSlice14450", "Squeeze14451", "BinaryOp14453", "/blocks.34/self_attn/Gather_2_output_0", "/blocks.34/self_attn/Mul_output_0", "/blocks.34/self_attn/Shape_2_output_0", "Shape14577", "Rank14579", "BinaryOp14581", "Unsqueeze14582", "BinaryOp14584", "Unsqueeze14585", "StridedSlice14588", "Squeeze14589", "BinaryOp14590", "BinaryOp14591", "/blocks.34/self_attn/Gather_4_output_0", "/blocks.34/self_attn/Div_output_0", "/blocks.34/self_attn/Unsqueeze_7_output_0", "/blocks.34/self_attn/Slice_1_output_0", "/blocks.34/self_attn/Neg_output_0", "/blocks.34/self_attn/Unsqueeze_6_output_0", "/blocks.34/self_attn/Slice_output_0", "/blocks.34/self_attn/Concat_3_output_0", "Unsqueeze14486", "Unsqueeze14489", "StridedSlice14492", "Squeeze14493", "BinaryOp14494", "BinaryOp14495", "/blocks.34/self_attn/Gather_3_output_0", "/blocks.34/self_attn/Mul_1_output_0", "/blocks.34/self_attn/Add_output_0", "/blocks.34/self_attn/k_proj/FakeLinear_output_0", "/blocks.34/self_attn/Unsqueeze_2_output_0", "/blocks.34/self_attn/Unsqueeze_3_output_0", "/blocks.34/self_attn/Concat_1_output_0", "/blocks.34/self_attn/Reshape_1_output_0", "/blocks.34/self_attn/k_norm/Cast_output_0", "/blocks.34/self_attn/k_norm/Mul_1_output_0", "/blocks.34/self_attn/Mul_2_output_0", "/blocks.34/self_attn/Shape_3_output_0", "Shape14457", "Rank14459", "BinaryOp14461", "Unsqueeze14462", "BinaryOp14464", "Unsqueeze14465", "StridedSlice14468", "Squeeze14469", "BinaryOp14470", "BinaryOp14471", "/blocks.34/self_attn/Gather_5_output_0", "/blocks.34/self_attn/Div_1_output_0", "/blocks.34/self_attn/Unsqueeze_9_output_0", "/blocks.34/self_attn/Slice_3_output_0", "/blocks.34/self_attn/Neg_1_output_0", "/blocks.34/self_attn/Unsqueeze_8_output_0", "/blocks.34/self_attn/Slice_2_output_0", "/blocks.34/self_attn/Concat_4_output_0", "/blocks.34/self_attn/Mul_3_output_0", "/blocks.34/self_attn/Add_1_output_0", "/blocks.34/self_attn/v_proj/FakeLinear_output_0", "/blocks.34/self_attn/Unsqueeze_4_output_0", "/blocks.34/self_attn/Unsqueeze_5_output_0", "/blocks.34/self_attn/Concat_2_output_0", "/blocks.34/self_attn/Reshape_2_output_0", "/blocks.34/self_attn/Reshape_7_output_0", "/blocks.34/self_attn/o_proj/FakeLinear_output_0", "/blocks.34/Add_output_0", "/blocks.34/post_attention_layernorm/Mul_1_output_0", "/blocks.34/mlp/gate_proj/FakeLinear_output_0", "/blocks.34/mlp/act_fn/Mul_output_0", "/blocks.34/mlp/up_proj/FakeLinear_output_0", "/blocks.34/mlp/Mul_output_0", "/blocks.34/mlp/down_proj/FakeLinear_output_0", "/blocks.34/Add_1_output_0", "/blocks.35/Reshape_output_0", "/blocks.35/input_layernorm/Mul_1_output_0", "/blocks.35/self_attn/q_proj/FakeLinear_output_0", "/blocks.35/self_attn/Shape_output_0", "Shape14816", "Rank14818", "BinaryOp14820", "Unsqueeze14821", "BinaryOp14823", "Unsqueeze14824", "StridedSlice14827", "Squeeze14828", "BinaryOp14830", "/blocks.35/self_attn/Gather_output_0", "/blocks.35/self_attn/Unsqueeze_output_0", "Unsqueeze14838", "Unsqueeze14841", "StridedSlice14844", "Squeeze14845", "BinaryOp14846", "BinaryOp14847", "/blocks.35/self_attn/Gather_1_output_0", "/blocks.35/self_attn/Unsqueeze_1_output_0", "/blocks.35/self_attn/Concat_output_0", "/blocks.35/self_attn/Reshape_output_0", "/blocks.35/self_attn/q_norm/Cast_output_0", "/blocks.35/self_attn/q_norm/Mul_1_output_0", "Unsqueeze14865", "Unsqueeze14868", "StridedSlice14871", "Squeeze14872", "BinaryOp14874", "/blocks.35/self_attn/Gather_2_output_0", "/blocks.35/self_attn/Mul_output_0", "/blocks.35/self_attn/Shape_2_output_0", "Shape14966", "Rank14968", "BinaryOp14970", "Unsqueeze14971", "BinaryOp14973", "Unsqueeze14974", "StridedSlice14977", "Squeeze14978", "BinaryOp14979", "BinaryOp14980", "/blocks.35/self_attn/Gather_4_output_0", "/blocks.35/self_attn/Div_output_0", "/blocks.35/self_attn/Unsqueeze_7_output_0", "/blocks.35/self_attn/Slice_1_output_0", "/blocks.35/self_attn/Neg_output_0", "/blocks.35/self_attn/Unsqueeze_6_output_0", "/blocks.35/self_attn/Slice_output_0", "/blocks.35/self_attn/Concat_3_output_0", "Unsqueeze14907", "Unsqueeze14910", "StridedSlice14913", "Squeeze14914", "BinaryOp14915", "BinaryOp14916", "/blocks.35/self_attn/Gather_3_output_0", "/blocks.35/self_attn/Mul_1_output_0", "/blocks.35/self_attn/Add_output_0", "/blocks.35/self_attn/k_proj/FakeLinear_output_0", "/blocks.35/self_attn/Unsqueeze_2_output_0", "/blocks.35/self_attn/Unsqueeze_3_output_0", "/blocks.35/self_attn/Concat_1_output_0", "/blocks.35/self_attn/Reshape_1_output_0", "/blocks.35/self_attn/k_norm/Cast_output_0", "/blocks.35/self_attn/k_norm/Mul_1_output_0", "/blocks.35/self_attn/Mul_2_output_0", "/blocks.35/self_attn/Shape_3_output_0", "Shape14878", "Rank14880", "BinaryOp14882", "Unsqueeze14883", "BinaryOp14885", "Unsqueeze14886", "StridedSlice14889", "Squeeze14890", "BinaryOp14891", "BinaryOp14892", "/blocks.35/self_attn/Gather_5_output_0", "/blocks.35/self_attn/Div_1_output_0", "/blocks.35/self_attn/Unsqueeze_9_output_0", "/blocks.35/self_attn/Slice_3_output_0", "/blocks.35/self_attn/Neg_1_output_0", "/blocks.35/self_attn/Unsqueeze_8_output_0", "/blocks.35/self_attn/Slice_2_output_0", "/blocks.35/self_attn/Concat_4_output_0", "/blocks.35/self_attn/Mul_3_output_0", "/blocks.35/self_attn/Add_1_output_0", "/blocks.35/self_attn/v_proj/FakeLinear_output_0", "/blocks.35/self_attn/Unsqueeze_4_output_0", "/blocks.35/self_attn/Unsqueeze_5_output_0", "/blocks.35/self_attn/Concat_2_output_0", "/blocks.35/self_attn/Reshape_2_output_0", "/blocks.35/self_attn/Reshape_7_output_0", "/blocks.35/self_attn/o_proj/FakeLinear_output_0", "/blocks.35/Add_output_0", "/blocks.35/post_attention_layernorm/Mul_1_output_0", "/blocks.35/mlp/gate_proj/FakeLinear_output_0", "/blocks.35/mlp/act_fn/Mul_output_0", "/blocks.35/mlp/up_proj/FakeLinear_output_0", "/blocks.35/mlp/Mul_output_0", "/blocks.35/mlp/down_proj/FakeLinear_output_0", "/blocks.35/Add_1_output_0", "/Slice_output_0", "hidden_states", "logits", "/layers.0/self_attn/q_proj/Linear/pre_reshape", "/layers.0/self_attn/q_proj/Linear/pre_convert", "/layers.0/self_attn/q_proj/Linear", "/layers.0/self_attn/q_proj/Linear/post_convert", "/layers.0/self_attn/k_proj/Linear/pre_reshape", "/layers.0/self_attn/k_proj/Linear/pre_convert", "/layers.0/self_attn/k_proj/Linear", "/layers.0/self_attn/k_proj/Linear/post_convert", "/layers.0/self_attn/v_proj/Linear/pre_reshape", "/layers.0/self_attn/v_proj/Linear/pre_convert", "/layers.0/self_attn/v_proj/Linear", "/layers.0/self_attn/v_proj/Linear/post_convert", "/layers.0/self_attn/o_proj/Linear/pre_reshape", "/layers.0/self_attn/o_proj/Linear/pre_convert", "/layers.0/self_attn/o_proj/Linear", "/layers.0/self_attn/o_proj/Linear/post_convert", "/layers.0/mlp/gate_proj/Linear/pre_reshape", "/layers.0/mlp/gate_proj/Linear/pre_convert", "/layers.0/mlp/gate_proj/Linear", "/layers.0/mlp/gate_proj/Linear/post_convert", "/layers.0/mlp/up_proj/Linear/pre_reshape", "/layers.0/mlp/up_proj/Linear/pre_convert", "/layers.0/mlp/up_proj/Linear", "/layers.0/mlp/up_proj/Linear/post_convert", "/layers.0/mlp/down_proj/Linear/pre_reshape", "/layers.0/mlp/down_proj/Linear/pre_convert", "/layers.0/mlp/down_proj/Linear", "/layers.0/mlp/down_proj/Linear/post_convert", "/layers.1/self_attn/q_proj/Linear/pre_reshape", "/layers.1/self_attn/q_proj/Linear/pre_convert", "/layers.1/self_attn/q_proj/Linear", "/layers.1/self_attn/q_proj/Linear/post_convert", "/layers.1/self_attn/k_proj/Linear/pre_reshape", "/layers.1/self_attn/k_proj/Linear/pre_convert", "/layers.1/self_attn/k_proj/Linear", "/layers.1/self_attn/k_proj/Linear/post_convert", "/layers.1/self_attn/v_proj/Linear/pre_reshape", "/layers.1/self_attn/v_proj/Linear/pre_convert", "/layers.1/self_attn/v_proj/Linear", "/layers.1/self_attn/v_proj/Linear/post_convert", "/layers.1/self_attn/o_proj/Linear/pre_reshape", "/layers.1/self_attn/o_proj/Linear/pre_convert", "/layers.1/self_attn/o_proj/Linear", "/layers.1/self_attn/o_proj/Linear/post_convert", "/layers.1/mlp/gate_proj/Linear/pre_reshape", "/layers.1/mlp/gate_proj/Linear/pre_convert", "/layers.1/mlp/gate_proj/Linear", "/layers.1/mlp/gate_proj/Linear/post_convert", "/layers.1/mlp/up_proj/Linear/pre_reshape", "/layers.1/mlp/up_proj/Linear/pre_convert", "/layers.1/mlp/up_proj/Linear", "/layers.1/mlp/up_proj/Linear/post_convert", "/layers.1/mlp/down_proj/Linear/pre_reshape", "/layers.1/mlp/down_proj/Linear/pre_convert", "/layers.1/mlp/down_proj/Linear", "/layers.1/mlp/down_proj/Linear/post_convert", "/layers.2/self_attn/q_proj/Linear/pre_reshape", "/layers.2/self_attn/q_proj/Linear/pre_convert", "/layers.2/self_attn/q_proj/Linear", "/layers.2/self_attn/q_proj/Linear/post_convert", "/layers.2/self_attn/k_proj/Linear/pre_reshape", "/layers.2/self_attn/k_proj/Linear/pre_convert", "/layers.2/self_attn/k_proj/Linear", "/layers.2/self_attn/k_proj/Linear/post_convert", "/layers.2/self_attn/v_proj/Linear/pre_reshape", "/layers.2/self_attn/v_proj/Linear/pre_convert", "/layers.2/self_attn/v_proj/Linear", "/layers.2/self_attn/v_proj/Linear/post_convert", "/layers.2/self_attn/o_proj/Linear/pre_reshape", "/layers.2/self_attn/o_proj/Linear/pre_convert", "/layers.2/self_attn/o_proj/Linear", "/layers.2/self_attn/o_proj/Linear/post_convert", "/layers.2/mlp/gate_proj/Linear/pre_reshape", "/layers.2/mlp/gate_proj/Linear/pre_convert", "/layers.2/mlp/gate_proj/Linear", "/layers.2/mlp/gate_proj/Linear/post_convert", "/layers.2/mlp/up_proj/Linear/pre_reshape", "/layers.2/mlp/up_proj/Linear/pre_convert", "/layers.2/mlp/up_proj/Linear", "/layers.2/mlp/up_proj/Linear/post_convert", "/layers.2/mlp/down_proj/Linear/pre_reshape", "/layers.2/mlp/down_proj/Linear/pre_convert", "/layers.2/mlp/down_proj/Linear", "/layers.2/mlp/down_proj/Linear/post_convert", "/layers.3/self_attn/q_proj/Linear/pre_reshape", "/layers.3/self_attn/q_proj/Linear/pre_convert", "/layers.3/self_attn/q_proj/Linear", "/layers.3/self_attn/q_proj/Linear/post_convert", "/layers.3/self_attn/k_proj/Linear/pre_reshape", "/layers.3/self_attn/k_proj/Linear/pre_convert", "/layers.3/self_attn/k_proj/Linear", "/layers.3/self_attn/k_proj/Linear/post_convert", "/layers.3/self_attn/v_proj/Linear/pre_reshape", "/layers.3/self_attn/v_proj/Linear/pre_convert", "/layers.3/self_attn/v_proj/Linear", "/layers.3/self_attn/v_proj/Linear/post_convert", "/layers.3/self_attn/o_proj/Linear/pre_reshape", "/layers.3/self_attn/o_proj/Linear/pre_convert", "/layers.3/self_attn/o_proj/Linear", "/layers.3/self_attn/o_proj/Linear/post_convert", "/layers.3/mlp/gate_proj/Linear/pre_reshape", "/layers.3/mlp/gate_proj/Linear/pre_convert", "/layers.3/mlp/gate_proj/Linear", "/layers.3/mlp/gate_proj/Linear/post_convert", "/layers.3/mlp/up_proj/Linear/pre_reshape", "/layers.3/mlp/up_proj/Linear/pre_convert", "/layers.3/mlp/up_proj/Linear", "/layers.3/mlp/up_proj/Linear/post_convert", "/layers.3/mlp/down_proj/Linear/pre_reshape", "/layers.3/mlp/down_proj/Linear/pre_convert", "/layers.3/mlp/down_proj/Linear", "/layers.3/mlp/down_proj/Linear/post_convert", "/layers.4/self_attn/q_proj/Linear/pre_reshape", "/layers.4/self_attn/q_proj/Linear/pre_convert", "/layers.4/self_attn/q_proj/Linear", "/layers.4/self_attn/q_proj/Linear/post_convert", "/layers.4/self_attn/k_proj/Linear/pre_reshape", "/layers.4/self_attn/k_proj/Linear/pre_convert", "/layers.4/self_attn/k_proj/Linear", "/layers.4/self_attn/k_proj/Linear/post_convert", "/layers.4/self_attn/v_proj/Linear/pre_reshape", "/layers.4/self_attn/v_proj/Linear/pre_convert", "/layers.4/self_attn/v_proj/Linear", "/layers.4/self_attn/v_proj/Linear/post_convert", "/layers.4/self_attn/o_proj/Linear/pre_reshape", "/layers.4/self_attn/o_proj/Linear/pre_convert", "/layers.4/self_attn/o_proj/Linear", "/layers.4/self_attn/o_proj/Linear/post_convert", "/layers.4/mlp/gate_proj/Linear/pre_reshape", "/layers.4/mlp/gate_proj/Linear/pre_convert", "/layers.4/mlp/gate_proj/Linear", "/layers.4/mlp/gate_proj/Linear/post_convert", "/layers.4/mlp/up_proj/Linear/pre_reshape", "/layers.4/mlp/up_proj/Linear/pre_convert", "/layers.4/mlp/up_proj/Linear", "/layers.4/mlp/up_proj/Linear/post_convert", "/layers.4/mlp/down_proj/Linear/pre_reshape", "/layers.4/mlp/down_proj/Linear/pre_convert", "/layers.4/mlp/down_proj/Linear", "/layers.4/mlp/down_proj/Linear/post_convert", "/layers.5/self_attn/q_proj/Linear/pre_reshape", "/layers.5/self_attn/q_proj/Linear/pre_convert", "/layers.5/self_attn/q_proj/Linear", "/layers.5/self_attn/q_proj/Linear/post_convert", "/layers.5/self_attn/k_proj/Linear/pre_reshape", "/layers.5/self_attn/k_proj/Linear/pre_convert", "/layers.5/self_attn/k_proj/Linear", "/layers.5/self_attn/k_proj/Linear/post_convert", "/layers.5/self_attn/v_proj/Linear/pre_reshape", "/layers.5/self_attn/v_proj/Linear/pre_convert", "/layers.5/self_attn/v_proj/Linear", "/layers.5/self_attn/v_proj/Linear/post_convert", "/layers.5/self_attn/o_proj/Linear/pre_reshape", "/layers.5/self_attn/o_proj/Linear/pre_convert", "/layers.5/self_attn/o_proj/Linear", "/layers.5/self_attn/o_proj/Linear/post_convert", "/layers.5/mlp/gate_proj/Linear/pre_reshape", "/layers.5/mlp/gate_proj/Linear/pre_convert", "/layers.5/mlp/gate_proj/Linear", "/layers.5/mlp/gate_proj/Linear/post_convert", "/layers.5/mlp/up_proj/Linear/pre_reshape", "/layers.5/mlp/up_proj/Linear/pre_convert", "/layers.5/mlp/up_proj/Linear", "/layers.5/mlp/up_proj/Linear/post_convert", "/layers.5/mlp/down_proj/Linear/pre_reshape", "/layers.5/mlp/down_proj/Linear/pre_convert", "/layers.5/mlp/down_proj/Linear", "/layers.5/mlp/down_proj/Linear/post_convert", "/layers.6/self_attn/q_proj/Linear/pre_reshape", "/layers.6/self_attn/q_proj/Linear/pre_convert", "/layers.6/self_attn/q_proj/Linear", "/layers.6/self_attn/q_proj/Linear/post_convert", "/layers.6/self_attn/k_proj/Linear/pre_reshape", "/layers.6/self_attn/k_proj/Linear/pre_convert", "/layers.6/self_attn/k_proj/Linear", "/layers.6/self_attn/k_proj/Linear/post_convert", "/layers.6/self_attn/v_proj/Linear/pre_reshape", "/layers.6/self_attn/v_proj/Linear/pre_convert", "/layers.6/self_attn/v_proj/Linear", "/layers.6/self_attn/v_proj/Linear/post_convert", "/layers.6/self_attn/o_proj/Linear/pre_reshape", "/layers.6/self_attn/o_proj/Linear/pre_convert", "/layers.6/self_attn/o_proj/Linear", "/layers.6/self_attn/o_proj/Linear/post_convert", "/layers.6/mlp/gate_proj/Linear/pre_reshape", "/layers.6/mlp/gate_proj/Linear/pre_convert", "/layers.6/mlp/gate_proj/Linear", "/layers.6/mlp/gate_proj/Linear/post_convert", "/layers.6/mlp/up_proj/Linear/pre_reshape", "/layers.6/mlp/up_proj/Linear/pre_convert", "/layers.6/mlp/up_proj/Linear", "/layers.6/mlp/up_proj/Linear/post_convert", "/layers.6/mlp/down_proj/Linear/pre_reshape", "/layers.6/mlp/down_proj/Linear/pre_convert", "/layers.6/mlp/down_proj/Linear", "/layers.6/mlp/down_proj/Linear/post_convert", "/layers.7/self_attn/q_proj/Linear/pre_reshape", "/layers.7/self_attn/q_proj/Linear/pre_convert", "/layers.7/self_attn/q_proj/Linear", "/layers.7/self_attn/q_proj/Linear/post_convert", "/layers.7/self_attn/k_proj/Linear/pre_reshape", "/layers.7/self_attn/k_proj/Linear/pre_convert", "/layers.7/self_attn/k_proj/Linear", "/layers.7/self_attn/k_proj/Linear/post_convert", "/layers.7/self_attn/v_proj/Linear/pre_reshape", "/layers.7/self_attn/v_proj/Linear/pre_convert", "/layers.7/self_attn/v_proj/Linear", "/layers.7/self_attn/v_proj/Linear/post_convert", "/layers.7/self_attn/o_proj/Linear/pre_reshape", "/layers.7/self_attn/o_proj/Linear/pre_convert", "/layers.7/self_attn/o_proj/Linear", "/layers.7/self_attn/o_proj/Linear/post_convert", "/layers.7/mlp/gate_proj/Linear/pre_reshape", "/layers.7/mlp/gate_proj/Linear/pre_convert", "/layers.7/mlp/gate_proj/Linear", "/layers.7/mlp/gate_proj/Linear/post_convert", "/layers.7/mlp/up_proj/Linear/pre_reshape", "/layers.7/mlp/up_proj/Linear/pre_convert", "/layers.7/mlp/up_proj/Linear", "/layers.7/mlp/up_proj/Linear/post_convert", "/layers.7/mlp/down_proj/Linear/pre_reshape", "/layers.7/mlp/down_proj/Linear/pre_convert", "/layers.7/mlp/down_proj/Linear", "/layers.7/mlp/down_proj/Linear/post_convert", "/layers.8/self_attn/q_proj/Linear/pre_reshape", "/layers.8/self_attn/q_proj/Linear/pre_convert", "/layers.8/self_attn/q_proj/Linear", "/layers.8/self_attn/q_proj/Linear/post_convert", "/layers.8/self_attn/k_proj/Linear/pre_reshape", "/layers.8/self_attn/k_proj/Linear/pre_convert", "/layers.8/self_attn/k_proj/Linear", "/layers.8/self_attn/k_proj/Linear/post_convert", "/layers.8/self_attn/v_proj/Linear/pre_reshape", "/layers.8/self_attn/v_proj/Linear/pre_convert", "/layers.8/self_attn/v_proj/Linear", "/layers.8/self_attn/v_proj/Linear/post_convert", "/layers.8/self_attn/o_proj/Linear/pre_reshape", "/layers.8/self_attn/o_proj/Linear/pre_convert", "/layers.8/self_attn/o_proj/Linear", "/layers.8/self_attn/o_proj/Linear/post_convert", "/layers.8/mlp/gate_proj/Linear/pre_reshape", "/layers.8/mlp/gate_proj/Linear/pre_convert", "/layers.8/mlp/gate_proj/Linear", "/layers.8/mlp/gate_proj/Linear/post_convert", "/layers.8/mlp/up_proj/Linear/pre_reshape", "/layers.8/mlp/up_proj/Linear/pre_convert", "/layers.8/mlp/up_proj/Linear", "/layers.8/mlp/up_proj/Linear/post_convert", "/layers.8/mlp/down_proj/Linear/pre_reshape", "/layers.8/mlp/down_proj/Linear/pre_convert", "/layers.8/mlp/down_proj/Linear", "/layers.8/mlp/down_proj/Linear/post_convert", "/layers.9/self_attn/q_proj/Linear/pre_reshape", "/layers.9/self_attn/q_proj/Linear/pre_convert", "/layers.9/self_attn/q_proj/Linear", "/layers.9/self_attn/q_proj/Linear/post_convert", "/layers.9/self_attn/k_proj/Linear/pre_reshape", "/layers.9/self_attn/k_proj/Linear/pre_convert", "/layers.9/self_attn/k_proj/Linear", "/layers.9/self_attn/k_proj/Linear/post_convert", "/layers.9/self_attn/v_proj/Linear/pre_reshape", "/layers.9/self_attn/v_proj/Linear/pre_convert", "/layers.9/self_attn/v_proj/Linear", "/layers.9/self_attn/v_proj/Linear/post_convert", "/layers.9/self_attn/o_proj/Linear/pre_reshape", "/layers.9/self_attn/o_proj/Linear/pre_convert", "/layers.9/self_attn/o_proj/Linear", "/layers.9/self_attn/o_proj/Linear/post_convert", "/layers.9/mlp/gate_proj/Linear/pre_reshape", "/layers.9/mlp/gate_proj/Linear/pre_convert", "/layers.9/mlp/gate_proj/Linear", "/layers.9/mlp/gate_proj/Linear/post_convert", "/layers.9/mlp/up_proj/Linear/pre_reshape", "/layers.9/mlp/up_proj/Linear/pre_convert", "/layers.9/mlp/up_proj/Linear", "/layers.9/mlp/up_proj/Linear/post_convert", "/layers.9/mlp/down_proj/Linear/pre_reshape", "/layers.9/mlp/down_proj/Linear/pre_convert", "/layers.9/mlp/down_proj/Linear", "/layers.9/mlp/down_proj/Linear/post_convert", "/layers.10/self_attn/q_proj/Linear/pre_reshape", "/layers.10/self_attn/q_proj/Linear/pre_convert", "/layers.10/self_attn/q_proj/Linear", "/layers.10/self_attn/q_proj/Linear/post_convert", "/layers.10/self_attn/k_proj/Linear/pre_reshape", "/layers.10/self_attn/k_proj/Linear/pre_convert", "/layers.10/self_attn/k_proj/Linear", "/layers.10/self_attn/k_proj/Linear/post_convert", "/layers.10/self_attn/v_proj/Linear/pre_reshape", "/layers.10/self_attn/v_proj/Linear/pre_convert", "/layers.10/self_attn/v_proj/Linear", "/layers.10/self_attn/v_proj/Linear/post_convert", "/layers.10/self_attn/o_proj/Linear/pre_reshape", "/layers.10/self_attn/o_proj/Linear/pre_convert", "/layers.10/self_attn/o_proj/Linear", "/layers.10/self_attn/o_proj/Linear/post_convert", "/layers.10/mlp/gate_proj/Linear/pre_reshape", "/layers.10/mlp/gate_proj/Linear/pre_convert", "/layers.10/mlp/gate_proj/Linear", "/layers.10/mlp/gate_proj/Linear/post_convert", "/layers.10/mlp/up_proj/Linear/pre_reshape", "/layers.10/mlp/up_proj/Linear/pre_convert", "/layers.10/mlp/up_proj/Linear", "/layers.10/mlp/up_proj/Linear/post_convert", "/layers.10/mlp/down_proj/Linear/pre_reshape", "/layers.10/mlp/down_proj/Linear/pre_convert", "/layers.10/mlp/down_proj/Linear", "/layers.10/mlp/down_proj/Linear/post_convert", "/layers.11/self_attn/q_proj/Linear/pre_reshape", "/layers.11/self_attn/q_proj/Linear/pre_convert", "/layers.11/self_attn/q_proj/Linear", "/layers.11/self_attn/q_proj/Linear/post_convert", "/layers.11/self_attn/k_proj/Linear/pre_reshape", "/layers.11/self_attn/k_proj/Linear/pre_convert", "/layers.11/self_attn/k_proj/Linear", "/layers.11/self_attn/k_proj/Linear/post_convert", "/layers.11/self_attn/v_proj/Linear/pre_reshape", "/layers.11/self_attn/v_proj/Linear/pre_convert", "/layers.11/self_attn/v_proj/Linear", "/layers.11/self_attn/v_proj/Linear/post_convert", "/layers.11/self_attn/o_proj/Linear/pre_reshape", "/layers.11/self_attn/o_proj/Linear/pre_convert", "/layers.11/self_attn/o_proj/Linear", "/layers.11/self_attn/o_proj/Linear/post_convert", "/layers.11/mlp/gate_proj/Linear/pre_reshape", "/layers.11/mlp/gate_proj/Linear/pre_convert", "/layers.11/mlp/gate_proj/Linear", "/layers.11/mlp/gate_proj/Linear/post_convert", "/layers.11/mlp/up_proj/Linear/pre_reshape", "/layers.11/mlp/up_proj/Linear/pre_convert", "/layers.11/mlp/up_proj/Linear", "/layers.11/mlp/up_proj/Linear/post_convert", "/layers.11/mlp/down_proj/Linear/pre_reshape", "/layers.11/mlp/down_proj/Linear/pre_convert", "/layers.11/mlp/down_proj/Linear", "/layers.11/mlp/down_proj/Linear/post_convert", "/layers.12/self_attn/q_proj/Linear/pre_reshape", "/layers.12/self_attn/q_proj/Linear/pre_convert", "/layers.12/self_attn/q_proj/Linear", "/layers.12/self_attn/q_proj/Linear/post_convert", "/layers.12/self_attn/k_proj/Linear/pre_reshape", "/layers.12/self_attn/k_proj/Linear/pre_convert", "/layers.12/self_attn/k_proj/Linear", "/layers.12/self_attn/k_proj/Linear/post_convert", "/layers.12/self_attn/v_proj/Linear/pre_reshape", "/layers.12/self_attn/v_proj/Linear/pre_convert", "/layers.12/self_attn/v_proj/Linear", "/layers.12/self_attn/v_proj/Linear/post_convert", "/layers.12/self_attn/o_proj/Linear/pre_reshape", "/layers.12/self_attn/o_proj/Linear/pre_convert", "/layers.12/self_attn/o_proj/Linear", "/layers.12/self_attn/o_proj/Linear/post_convert", "/layers.12/mlp/gate_proj/Linear/pre_reshape", "/layers.12/mlp/gate_proj/Linear/pre_convert", "/layers.12/mlp/gate_proj/Linear", "/layers.12/mlp/gate_proj/Linear/post_convert", "/layers.12/mlp/up_proj/Linear/pre_reshape", "/layers.12/mlp/up_proj/Linear/pre_convert", "/layers.12/mlp/up_proj/Linear", "/layers.12/mlp/up_proj/Linear/post_convert", "/layers.12/mlp/down_proj/Linear/pre_reshape", "/layers.12/mlp/down_proj/Linear/pre_convert", "/layers.12/mlp/down_proj/Linear", "/layers.12/mlp/down_proj/Linear/post_convert", "/layers.13/self_attn/q_proj/Linear/pre_reshape", "/layers.13/self_attn/q_proj/Linear/pre_convert", "/layers.13/self_attn/q_proj/Linear", "/layers.13/self_attn/q_proj/Linear/post_convert", "/layers.13/self_attn/k_proj/Linear/pre_reshape", "/layers.13/self_attn/k_proj/Linear/pre_convert", "/layers.13/self_attn/k_proj/Linear", "/layers.13/self_attn/k_proj/Linear/post_convert", "/layers.13/self_attn/v_proj/Linear/pre_reshape", "/layers.13/self_attn/v_proj/Linear/pre_convert", "/layers.13/self_attn/v_proj/Linear", "/layers.13/self_attn/v_proj/Linear/post_convert", "/layers.13/self_attn/o_proj/Linear/pre_reshape", "/layers.13/self_attn/o_proj/Linear/pre_convert", "/layers.13/self_attn/o_proj/Linear", "/layers.13/self_attn/o_proj/Linear/post_convert", "/layers.13/mlp/gate_proj/Linear/pre_reshape", "/layers.13/mlp/gate_proj/Linear/pre_convert", "/layers.13/mlp/gate_proj/Linear", "/layers.13/mlp/gate_proj/Linear/post_convert", "/layers.13/mlp/up_proj/Linear/pre_reshape", "/layers.13/mlp/up_proj/Linear/pre_convert", "/layers.13/mlp/up_proj/Linear", "/layers.13/mlp/up_proj/Linear/post_convert", "/layers.13/mlp/down_proj/Linear/pre_reshape", "/layers.13/mlp/down_proj/Linear/pre_convert", "/layers.13/mlp/down_proj/Linear", "/layers.13/mlp/down_proj/Linear/post_convert", "/layers.14/self_attn/q_proj/Linear/pre_reshape", "/layers.14/self_attn/q_proj/Linear/pre_convert", "/layers.14/self_attn/q_proj/Linear", "/layers.14/self_attn/q_proj/Linear/post_convert", "/layers.14/self_attn/k_proj/Linear/pre_reshape", "/layers.14/self_attn/k_proj/Linear/pre_convert", "/layers.14/self_attn/k_proj/Linear", "/layers.14/self_attn/k_proj/Linear/post_convert", "/layers.14/self_attn/v_proj/Linear/pre_reshape", "/layers.14/self_attn/v_proj/Linear/pre_convert", "/layers.14/self_attn/v_proj/Linear", "/layers.14/self_attn/v_proj/Linear/post_convert", "/layers.14/self_attn/o_proj/Linear/pre_reshape", "/layers.14/self_attn/o_proj/Linear/pre_convert", "/layers.14/self_attn/o_proj/Linear", "/layers.14/self_attn/o_proj/Linear/post_convert", "/layers.14/mlp/gate_proj/Linear/pre_reshape", "/layers.14/mlp/gate_proj/Linear/pre_convert", "/layers.14/mlp/gate_proj/Linear", "/layers.14/mlp/gate_proj/Linear/post_convert", "/layers.14/mlp/up_proj/Linear/pre_reshape", "/layers.14/mlp/up_proj/Linear/pre_convert", "/layers.14/mlp/up_proj/Linear", "/layers.14/mlp/up_proj/Linear/post_convert", "/layers.14/mlp/down_proj/Linear/pre_reshape", "/layers.14/mlp/down_proj/Linear/pre_convert", "/layers.14/mlp/down_proj/Linear", "/layers.14/mlp/down_proj/Linear/post_convert", "/layers.15/self_attn/q_proj/Linear/pre_reshape", "/layers.15/self_attn/q_proj/Linear/pre_convert", "/layers.15/self_attn/q_proj/Linear", "/layers.15/self_attn/q_proj/Linear/post_convert", "/layers.15/self_attn/k_proj/Linear/pre_reshape", "/layers.15/self_attn/k_proj/Linear/pre_convert", "/layers.15/self_attn/k_proj/Linear", "/layers.15/self_attn/k_proj/Linear/post_convert", "/layers.15/self_attn/v_proj/Linear/pre_reshape", "/layers.15/self_attn/v_proj/Linear/pre_convert", "/layers.15/self_attn/v_proj/Linear", "/layers.15/self_attn/v_proj/Linear/post_convert", "/layers.15/self_attn/o_proj/Linear/pre_reshape", "/layers.15/self_attn/o_proj/Linear/pre_convert", "/layers.15/self_attn/o_proj/Linear", "/layers.15/self_attn/o_proj/Linear/post_convert", "/layers.15/mlp/gate_proj/Linear/pre_reshape", "/layers.15/mlp/gate_proj/Linear/pre_convert", "/layers.15/mlp/gate_proj/Linear", "/layers.15/mlp/gate_proj/Linear/post_convert", "/layers.15/mlp/up_proj/Linear/pre_reshape", "/layers.15/mlp/up_proj/Linear/pre_convert", "/layers.15/mlp/up_proj/Linear", "/layers.15/mlp/up_proj/Linear/post_convert", "/layers.15/mlp/down_proj/Linear/pre_reshape", "/layers.15/mlp/down_proj/Linear/pre_convert", "/layers.15/mlp/down_proj/Linear", "/layers.15/mlp/down_proj/Linear/post_convert", "/layers.16/self_attn/q_proj/Linear/pre_reshape", "/layers.16/self_attn/q_proj/Linear/pre_convert", "/layers.16/self_attn/q_proj/Linear", "/layers.16/self_attn/q_proj/Linear/post_convert", "/layers.16/self_attn/k_proj/Linear/pre_reshape", "/layers.16/self_attn/k_proj/Linear/pre_convert", "/layers.16/self_attn/k_proj/Linear", "/layers.16/self_attn/k_proj/Linear/post_convert", "/layers.16/self_attn/v_proj/Linear/pre_reshape", "/layers.16/self_attn/v_proj/Linear/pre_convert", "/layers.16/self_attn/v_proj/Linear", "/layers.16/self_attn/v_proj/Linear/post_convert", "/layers.16/self_attn/o_proj/Linear/pre_reshape", "/layers.16/self_attn/o_proj/Linear/pre_convert", "/layers.16/self_attn/o_proj/Linear", "/layers.16/self_attn/o_proj/Linear/post_convert", "/layers.16/mlp/gate_proj/Linear/pre_reshape", "/layers.16/mlp/gate_proj/Linear/pre_convert", "/layers.16/mlp/gate_proj/Linear", "/layers.16/mlp/gate_proj/Linear/post_convert", "/layers.16/mlp/up_proj/Linear/pre_reshape", "/layers.16/mlp/up_proj/Linear/pre_convert", "/layers.16/mlp/up_proj/Linear", "/layers.16/mlp/up_proj/Linear/post_convert", "/layers.16/mlp/down_proj/Linear/pre_reshape", "/layers.16/mlp/down_proj/Linear/pre_convert", "/layers.16/mlp/down_proj/Linear", "/layers.16/mlp/down_proj/Linear/post_convert", "/layers.17/self_attn/q_proj/Linear/pre_reshape", "/layers.17/self_attn/q_proj/Linear/pre_convert", "/layers.17/self_attn/q_proj/Linear", "/layers.17/self_attn/q_proj/Linear/post_convert", "/layers.17/self_attn/k_proj/Linear/pre_reshape", "/layers.17/self_attn/k_proj/Linear/pre_convert", "/layers.17/self_attn/k_proj/Linear", "/layers.17/self_attn/k_proj/Linear/post_convert", "/layers.17/self_attn/v_proj/Linear/pre_reshape", "/layers.17/self_attn/v_proj/Linear/pre_convert", "/layers.17/self_attn/v_proj/Linear", "/layers.17/self_attn/v_proj/Linear/post_convert", "/layers.17/self_attn/o_proj/Linear/pre_reshape", "/layers.17/self_attn/o_proj/Linear/pre_convert", "/layers.17/self_attn/o_proj/Linear", "/layers.17/self_attn/o_proj/Linear/post_convert", "/layers.17/mlp/gate_proj/Linear/pre_reshape", "/layers.17/mlp/gate_proj/Linear/pre_convert", "/layers.17/mlp/gate_proj/Linear", "/layers.17/mlp/gate_proj/Linear/post_convert", "/layers.17/mlp/up_proj/Linear/pre_reshape", "/layers.17/mlp/up_proj/Linear/pre_convert", "/layers.17/mlp/up_proj/Linear", "/layers.17/mlp/up_proj/Linear/post_convert", "/layers.17/mlp/down_proj/Linear/pre_reshape", "/layers.17/mlp/down_proj/Linear/pre_convert", "/layers.17/mlp/down_proj/Linear", "/layers.17/mlp/down_proj/Linear/post_convert", "/layers.18/self_attn/q_proj/Linear/pre_reshape", "/layers.18/self_attn/q_proj/Linear/pre_convert", "/layers.18/self_attn/q_proj/Linear", "/layers.18/self_attn/q_proj/Linear/post_convert", "/layers.18/self_attn/k_proj/Linear/pre_reshape", "/layers.18/self_attn/k_proj/Linear/pre_convert", "/layers.18/self_attn/k_proj/Linear", "/layers.18/self_attn/k_proj/Linear/post_convert", "/layers.18/self_attn/v_proj/Linear/pre_reshape", "/layers.18/self_attn/v_proj/Linear/pre_convert", "/layers.18/self_attn/v_proj/Linear", "/layers.18/self_attn/v_proj/Linear/post_convert", "/layers.18/self_attn/o_proj/Linear/pre_reshape", "/layers.18/self_attn/o_proj/Linear/pre_convert", "/layers.18/self_attn/o_proj/Linear", "/layers.18/self_attn/o_proj/Linear/post_convert", "/layers.18/mlp/gate_proj/Linear/pre_reshape", "/layers.18/mlp/gate_proj/Linear/pre_convert", "/layers.18/mlp/gate_proj/Linear", "/layers.18/mlp/gate_proj/Linear/post_convert", "/layers.18/mlp/up_proj/Linear/pre_reshape", "/layers.18/mlp/up_proj/Linear/pre_convert", "/layers.18/mlp/up_proj/Linear", "/layers.18/mlp/up_proj/Linear/post_convert", "/layers.18/mlp/down_proj/Linear/pre_reshape", "/layers.18/mlp/down_proj/Linear/pre_convert", "/layers.18/mlp/down_proj/Linear", "/layers.18/mlp/down_proj/Linear/post_convert", "/layers.19/self_attn/q_proj/Linear/pre_reshape", "/layers.19/self_attn/q_proj/Linear/pre_convert", "/layers.19/self_attn/q_proj/Linear", "/layers.19/self_attn/q_proj/Linear/post_convert", "/layers.19/self_attn/k_proj/Linear/pre_reshape", "/layers.19/self_attn/k_proj/Linear/pre_convert", "/layers.19/self_attn/k_proj/Linear", "/layers.19/self_attn/k_proj/Linear/post_convert", "/layers.19/self_attn/v_proj/Linear/pre_reshape", "/layers.19/self_attn/v_proj/Linear/pre_convert", "/layers.19/self_attn/v_proj/Linear", "/layers.19/self_attn/v_proj/Linear/post_convert", "/layers.19/self_attn/o_proj/Linear/pre_reshape", "/layers.19/self_attn/o_proj/Linear/pre_convert", "/layers.19/self_attn/o_proj/Linear", "/layers.19/self_attn/o_proj/Linear/post_convert", "/layers.19/mlp/gate_proj/Linear/pre_reshape", "/layers.19/mlp/gate_proj/Linear/pre_convert", "/layers.19/mlp/gate_proj/Linear", "/layers.19/mlp/gate_proj/Linear/post_convert", "/layers.19/mlp/up_proj/Linear/pre_reshape", "/layers.19/mlp/up_proj/Linear/pre_convert", "/layers.19/mlp/up_proj/Linear", "/layers.19/mlp/up_proj/Linear/post_convert", "/layers.19/mlp/down_proj/Linear/pre_reshape", "/layers.19/mlp/down_proj/Linear/pre_convert", "/layers.19/mlp/down_proj/Linear", "/layers.19/mlp/down_proj/Linear/post_convert", "/layers.20/self_attn/q_proj/Linear/pre_reshape", "/layers.20/self_attn/q_proj/Linear/pre_convert", "/layers.20/self_attn/q_proj/Linear", "/layers.20/self_attn/q_proj/Linear/post_convert", "/layers.20/self_attn/k_proj/Linear/pre_reshape", "/layers.20/self_attn/k_proj/Linear/pre_convert", "/layers.20/self_attn/k_proj/Linear", "/layers.20/self_attn/k_proj/Linear/post_convert", "/layers.20/self_attn/v_proj/Linear/pre_reshape", "/layers.20/self_attn/v_proj/Linear/pre_convert", "/layers.20/self_attn/v_proj/Linear", "/layers.20/self_attn/v_proj/Linear/post_convert", "/layers.20/self_attn/o_proj/Linear/pre_reshape", "/layers.20/self_attn/o_proj/Linear/pre_convert", "/layers.20/self_attn/o_proj/Linear", "/layers.20/self_attn/o_proj/Linear/post_convert", "/layers.20/mlp/gate_proj/Linear/pre_reshape", "/layers.20/mlp/gate_proj/Linear/pre_convert", "/layers.20/mlp/gate_proj/Linear", "/layers.20/mlp/gate_proj/Linear/post_convert", "/layers.20/mlp/up_proj/Linear/pre_reshape", "/layers.20/mlp/up_proj/Linear/pre_convert", "/layers.20/mlp/up_proj/Linear", "/layers.20/mlp/up_proj/Linear/post_convert", "/layers.20/mlp/down_proj/Linear/pre_reshape", "/layers.20/mlp/down_proj/Linear/pre_convert", "/layers.20/mlp/down_proj/Linear", "/layers.20/mlp/down_proj/Linear/post_convert", "/layers.21/self_attn/q_proj/Linear/pre_reshape", "/layers.21/self_attn/q_proj/Linear/pre_convert", "/layers.21/self_attn/q_proj/Linear", "/layers.21/self_attn/q_proj/Linear/post_convert", "/layers.21/self_attn/k_proj/Linear/pre_reshape", "/layers.21/self_attn/k_proj/Linear/pre_convert", "/layers.21/self_attn/k_proj/Linear", "/layers.21/self_attn/k_proj/Linear/post_convert", "/layers.21/self_attn/v_proj/Linear/pre_reshape", "/layers.21/self_attn/v_proj/Linear/pre_convert", "/layers.21/self_attn/v_proj/Linear", "/layers.21/self_attn/v_proj/Linear/post_convert", "/layers.21/self_attn/o_proj/Linear/pre_reshape", "/layers.21/self_attn/o_proj/Linear/pre_convert", "/layers.21/self_attn/o_proj/Linear", "/layers.21/self_attn/o_proj/Linear/post_convert", "/layers.21/mlp/gate_proj/Linear/pre_reshape", "/layers.21/mlp/gate_proj/Linear/pre_convert", "/layers.21/mlp/gate_proj/Linear", "/layers.21/mlp/gate_proj/Linear/post_convert", "/layers.21/mlp/up_proj/Linear/pre_reshape", "/layers.21/mlp/up_proj/Linear/pre_convert", "/layers.21/mlp/up_proj/Linear", "/layers.21/mlp/up_proj/Linear/post_convert", "/layers.21/mlp/down_proj/Linear/pre_reshape", "/layers.21/mlp/down_proj/Linear/pre_convert", "/layers.21/mlp/down_proj/Linear", "/layers.21/mlp/down_proj/Linear/post_convert", "/layers.22/self_attn/q_proj/Linear/pre_reshape", "/layers.22/self_attn/q_proj/Linear/pre_convert", "/layers.22/self_attn/q_proj/Linear", "/layers.22/self_attn/q_proj/Linear/post_convert", "/layers.22/self_attn/k_proj/Linear/pre_reshape", "/layers.22/self_attn/k_proj/Linear/pre_convert", "/layers.22/self_attn/k_proj/Linear", "/layers.22/self_attn/k_proj/Linear/post_convert", "/layers.22/self_attn/v_proj/Linear/pre_reshape", "/layers.22/self_attn/v_proj/Linear/pre_convert", "/layers.22/self_attn/v_proj/Linear", "/layers.22/self_attn/v_proj/Linear/post_convert", "/layers.22/self_attn/o_proj/Linear/pre_reshape", "/layers.22/self_attn/o_proj/Linear/pre_convert", "/layers.22/self_attn/o_proj/Linear", "/layers.22/self_attn/o_proj/Linear/post_convert", "/layers.22/mlp/gate_proj/Linear/pre_reshape", "/layers.22/mlp/gate_proj/Linear/pre_convert", "/layers.22/mlp/gate_proj/Linear", "/layers.22/mlp/gate_proj/Linear/post_convert", "/layers.22/mlp/up_proj/Linear/pre_reshape", "/layers.22/mlp/up_proj/Linear/pre_convert", "/layers.22/mlp/up_proj/Linear", "/layers.22/mlp/up_proj/Linear/post_convert", "/layers.22/mlp/down_proj/Linear/pre_reshape", "/layers.22/mlp/down_proj/Linear/pre_convert", "/layers.22/mlp/down_proj/Linear", "/layers.22/mlp/down_proj/Linear/post_convert", "/layers.23/self_attn/q_proj/Linear/pre_reshape", "/layers.23/self_attn/q_proj/Linear/pre_convert", "/layers.23/self_attn/q_proj/Linear", "/layers.23/self_attn/q_proj/Linear/post_convert", "/layers.23/self_attn/k_proj/Linear/pre_reshape", "/layers.23/self_attn/k_proj/Linear/pre_convert", "/layers.23/self_attn/k_proj/Linear", "/layers.23/self_attn/k_proj/Linear/post_convert", "/layers.23/self_attn/v_proj/Linear/pre_reshape", "/layers.23/self_attn/v_proj/Linear/pre_convert", "/layers.23/self_attn/v_proj/Linear", "/layers.23/self_attn/v_proj/Linear/post_convert", "/layers.23/self_attn/o_proj/Linear/pre_reshape", "/layers.23/self_attn/o_proj/Linear/pre_convert", "/layers.23/self_attn/o_proj/Linear", "/layers.23/self_attn/o_proj/Linear/post_convert", "/layers.23/mlp/gate_proj/Linear/pre_reshape", "/layers.23/mlp/gate_proj/Linear/pre_convert", "/layers.23/mlp/gate_proj/Linear", "/layers.23/mlp/gate_proj/Linear/post_convert", "/layers.23/mlp/up_proj/Linear/pre_reshape", "/layers.23/mlp/up_proj/Linear/pre_convert", "/layers.23/mlp/up_proj/Linear", "/layers.23/mlp/up_proj/Linear/post_convert", "/layers.23/mlp/down_proj/Linear/pre_reshape", "/layers.23/mlp/down_proj/Linear/pre_convert", "/layers.23/mlp/down_proj/Linear", "/layers.23/mlp/down_proj/Linear/post_convert", "/layers.24/self_attn/q_proj/Linear/pre_reshape", "/layers.24/self_attn/q_proj/Linear/pre_convert", "/layers.24/self_attn/q_proj/Linear", "/layers.24/self_attn/q_proj/Linear/post_convert", "/layers.24/self_attn/k_proj/Linear/pre_reshape", "/layers.24/self_attn/k_proj/Linear/pre_convert", "/layers.24/self_attn/k_proj/Linear", "/layers.24/self_attn/k_proj/Linear/post_convert", "/layers.24/self_attn/v_proj/Linear/pre_reshape", "/layers.24/self_attn/v_proj/Linear/pre_convert", "/layers.24/self_attn/v_proj/Linear", "/layers.24/self_attn/v_proj/Linear/post_convert", "/layers.24/self_attn/o_proj/Linear/pre_reshape", "/layers.24/self_attn/o_proj/Linear/pre_convert", "/layers.24/self_attn/o_proj/Linear", "/layers.24/self_attn/o_proj/Linear/post_convert", "/layers.24/mlp/gate_proj/Linear/pre_reshape", "/layers.24/mlp/gate_proj/Linear/pre_convert", "/layers.24/mlp/gate_proj/Linear", "/layers.24/mlp/gate_proj/Linear/post_convert", "/layers.24/mlp/up_proj/Linear/pre_reshape", "/layers.24/mlp/up_proj/Linear/pre_convert", "/layers.24/mlp/up_proj/Linear", "/layers.24/mlp/up_proj/Linear/post_convert", "/layers.24/mlp/down_proj/Linear/pre_reshape", "/layers.24/mlp/down_proj/Linear/pre_convert", "/layers.24/mlp/down_proj/Linear", "/layers.24/mlp/down_proj/Linear/post_convert", "/layers.25/self_attn/q_proj/Linear/pre_reshape", "/layers.25/self_attn/q_proj/Linear/pre_convert", "/layers.25/self_attn/q_proj/Linear", "/layers.25/self_attn/q_proj/Linear/post_convert", "/layers.25/self_attn/k_proj/Linear/pre_reshape", "/layers.25/self_attn/k_proj/Linear/pre_convert", "/layers.25/self_attn/k_proj/Linear", "/layers.25/self_attn/k_proj/Linear/post_convert", "/layers.25/self_attn/v_proj/Linear/pre_reshape", "/layers.25/self_attn/v_proj/Linear/pre_convert", "/layers.25/self_attn/v_proj/Linear", "/layers.25/self_attn/v_proj/Linear/post_convert", "/layers.25/self_attn/o_proj/Linear/pre_reshape", "/layers.25/self_attn/o_proj/Linear/pre_convert", "/layers.25/self_attn/o_proj/Linear", "/layers.25/self_attn/o_proj/Linear/post_convert", "/layers.25/mlp/gate_proj/Linear/pre_reshape", "/layers.25/mlp/gate_proj/Linear/pre_convert", "/layers.25/mlp/gate_proj/Linear", "/layers.25/mlp/gate_proj/Linear/post_convert", "/layers.25/mlp/up_proj/Linear/pre_reshape", "/layers.25/mlp/up_proj/Linear/pre_convert", "/layers.25/mlp/up_proj/Linear", "/layers.25/mlp/up_proj/Linear/post_convert", "/layers.25/mlp/down_proj/Linear/pre_reshape", "/layers.25/mlp/down_proj/Linear/pre_convert", "/layers.25/mlp/down_proj/Linear", "/layers.25/mlp/down_proj/Linear/post_convert", "/layers.26/self_attn/q_proj/Linear/pre_reshape", "/layers.26/self_attn/q_proj/Linear/pre_convert", "/layers.26/self_attn/q_proj/Linear", "/layers.26/self_attn/q_proj/Linear/post_convert", "/layers.26/self_attn/k_proj/Linear/pre_reshape", "/layers.26/self_attn/k_proj/Linear/pre_convert", "/layers.26/self_attn/k_proj/Linear", "/layers.26/self_attn/k_proj/Linear/post_convert", "/layers.26/self_attn/v_proj/Linear/pre_reshape", "/layers.26/self_attn/v_proj/Linear/pre_convert", "/layers.26/self_attn/v_proj/Linear", "/layers.26/self_attn/v_proj/Linear/post_convert", "/layers.26/self_attn/o_proj/Linear/pre_reshape", "/layers.26/self_attn/o_proj/Linear/pre_convert", "/layers.26/self_attn/o_proj/Linear", "/layers.26/self_attn/o_proj/Linear/post_convert", "/layers.26/mlp/gate_proj/Linear/pre_reshape", "/layers.26/mlp/gate_proj/Linear/pre_convert", "/layers.26/mlp/gate_proj/Linear", "/layers.26/mlp/gate_proj/Linear/post_convert", "/layers.26/mlp/up_proj/Linear/pre_reshape", "/layers.26/mlp/up_proj/Linear/pre_convert", "/layers.26/mlp/up_proj/Linear", "/layers.26/mlp/up_proj/Linear/post_convert", "/layers.26/mlp/down_proj/Linear/pre_reshape", "/layers.26/mlp/down_proj/Linear/pre_convert", "/layers.26/mlp/down_proj/Linear", "/layers.26/mlp/down_proj/Linear/post_convert", "/layers.27/self_attn/q_proj/Linear/pre_reshape", "/layers.27/self_attn/q_proj/Linear/pre_convert", "/layers.27/self_attn/q_proj/Linear", "/layers.27/self_attn/q_proj/Linear/post_convert", "/layers.27/self_attn/k_proj/Linear/pre_reshape", "/layers.27/self_attn/k_proj/Linear/pre_convert", "/layers.27/self_attn/k_proj/Linear", "/layers.27/self_attn/k_proj/Linear/post_convert", "/layers.27/self_attn/v_proj/Linear/pre_reshape", "/layers.27/self_attn/v_proj/Linear/pre_convert", "/layers.27/self_attn/v_proj/Linear", "/layers.27/self_attn/v_proj/Linear/post_convert", "/layers.27/self_attn/o_proj/Linear/pre_reshape", "/layers.27/self_attn/o_proj/Linear/pre_convert", "/layers.27/self_attn/o_proj/Linear", "/layers.27/self_attn/o_proj/Linear/post_convert", "/layers.27/mlp/gate_proj/Linear/pre_reshape", "/layers.27/mlp/gate_proj/Linear/pre_convert", "/layers.27/mlp/gate_proj/Linear", "/layers.27/mlp/gate_proj/Linear/post_convert", "/layers.27/mlp/up_proj/Linear/pre_reshape", "/layers.27/mlp/up_proj/Linear/pre_convert", "/layers.27/mlp/up_proj/Linear", "/layers.27/mlp/up_proj/Linear/post_convert", "/layers.27/mlp/down_proj/Linear/pre_reshape", "/layers.27/mlp/down_proj/Linear/pre_convert", "/layers.27/mlp/down_proj/Linear", "/layers.27/mlp/down_proj/Linear/post_convert", "/layers.28/self_attn/q_proj/Linear/pre_reshape", "/layers.28/self_attn/q_proj/Linear/pre_convert", "/layers.28/self_attn/q_proj/Linear", "/layers.28/self_attn/q_proj/Linear/post_convert", "/layers.28/self_attn/k_proj/Linear/pre_reshape", "/layers.28/self_attn/k_proj/Linear/pre_convert", "/layers.28/self_attn/k_proj/Linear", "/layers.28/self_attn/k_proj/Linear/post_convert", "/layers.28/self_attn/v_proj/Linear/pre_reshape", "/layers.28/self_attn/v_proj/Linear/pre_convert", "/layers.28/self_attn/v_proj/Linear", "/layers.28/self_attn/v_proj/Linear/post_convert", "/layers.28/self_attn/o_proj/Linear/pre_reshape", "/layers.28/self_attn/o_proj/Linear/pre_convert", "/layers.28/self_attn/o_proj/Linear", "/layers.28/self_attn/o_proj/Linear/post_convert", "/layers.28/mlp/gate_proj/Linear/pre_reshape", "/layers.28/mlp/gate_proj/Linear/pre_convert", "/layers.28/mlp/gate_proj/Linear", "/layers.28/mlp/gate_proj/Linear/post_convert", "/layers.28/mlp/up_proj/Linear/pre_reshape", "/layers.28/mlp/up_proj/Linear/pre_convert", "/layers.28/mlp/up_proj/Linear", "/layers.28/mlp/up_proj/Linear/post_convert", "/layers.28/mlp/down_proj/Linear/pre_reshape", "/layers.28/mlp/down_proj/Linear/pre_convert", "/layers.28/mlp/down_proj/Linear", "/layers.28/mlp/down_proj/Linear/post_convert", "/layers.29/self_attn/q_proj/Linear/pre_reshape", "/layers.29/self_attn/q_proj/Linear/pre_convert", "/layers.29/self_attn/q_proj/Linear", "/layers.29/self_attn/q_proj/Linear/post_convert", "/layers.29/self_attn/k_proj/Linear/pre_reshape", "/layers.29/self_attn/k_proj/Linear/pre_convert", "/layers.29/self_attn/k_proj/Linear", "/layers.29/self_attn/k_proj/Linear/post_convert", "/layers.29/self_attn/v_proj/Linear/pre_reshape", "/layers.29/self_attn/v_proj/Linear/pre_convert", "/layers.29/self_attn/v_proj/Linear", "/layers.29/self_attn/v_proj/Linear/post_convert", "/layers.29/self_attn/o_proj/Linear/pre_reshape", "/layers.29/self_attn/o_proj/Linear/pre_convert", "/layers.29/self_attn/o_proj/Linear", "/layers.29/self_attn/o_proj/Linear/post_convert", "/layers.29/mlp/gate_proj/Linear/pre_reshape", "/layers.29/mlp/gate_proj/Linear/pre_convert", "/layers.29/mlp/gate_proj/Linear", "/layers.29/mlp/gate_proj/Linear/post_convert", "/layers.29/mlp/up_proj/Linear/pre_reshape", "/layers.29/mlp/up_proj/Linear/pre_convert", "/layers.29/mlp/up_proj/Linear", "/layers.29/mlp/up_proj/Linear/post_convert", "/layers.29/mlp/down_proj/Linear/pre_reshape", "/layers.29/mlp/down_proj/Linear/pre_convert", "/layers.29/mlp/down_proj/Linear", "/layers.29/mlp/down_proj/Linear/post_convert", "/layers.30/self_attn/q_proj/Linear/pre_reshape", "/layers.30/self_attn/q_proj/Linear/pre_convert", "/layers.30/self_attn/q_proj/Linear", "/layers.30/self_attn/q_proj/Linear/post_convert", "/layers.30/self_attn/k_proj/Linear/pre_reshape", "/layers.30/self_attn/k_proj/Linear/pre_convert", "/layers.30/self_attn/k_proj/Linear", "/layers.30/self_attn/k_proj/Linear/post_convert", "/layers.30/self_attn/v_proj/Linear/pre_reshape", "/layers.30/self_attn/v_proj/Linear/pre_convert", "/layers.30/self_attn/v_proj/Linear", "/layers.30/self_attn/v_proj/Linear/post_convert", "/layers.30/self_attn/o_proj/Linear/pre_reshape", "/layers.30/self_attn/o_proj/Linear/pre_convert", "/layers.30/self_attn/o_proj/Linear", "/layers.30/self_attn/o_proj/Linear/post_convert", "/layers.30/mlp/gate_proj/Linear/pre_reshape", "/layers.30/mlp/gate_proj/Linear/pre_convert", "/layers.30/mlp/gate_proj/Linear", "/layers.30/mlp/gate_proj/Linear/post_convert", "/layers.30/mlp/up_proj/Linear/pre_reshape", "/layers.30/mlp/up_proj/Linear/pre_convert", "/layers.30/mlp/up_proj/Linear", "/layers.30/mlp/up_proj/Linear/post_convert", "/layers.30/mlp/down_proj/Linear/pre_reshape", "/layers.30/mlp/down_proj/Linear/pre_convert", "/layers.30/mlp/down_proj/Linear", "/layers.30/mlp/down_proj/Linear/post_convert", "/layers.31/self_attn/q_proj/Linear/pre_reshape", "/layers.31/self_attn/q_proj/Linear/pre_convert", "/layers.31/self_attn/q_proj/Linear", "/layers.31/self_attn/q_proj/Linear/post_convert", "/layers.31/self_attn/k_proj/Linear/pre_reshape", "/layers.31/self_attn/k_proj/Linear/pre_convert", "/layers.31/self_attn/k_proj/Linear", "/layers.31/self_attn/k_proj/Linear/post_convert", "/layers.31/self_attn/v_proj/Linear/pre_reshape", "/layers.31/self_attn/v_proj/Linear/pre_convert", "/layers.31/self_attn/v_proj/Linear", "/layers.31/self_attn/v_proj/Linear/post_convert", "/layers.31/self_attn/o_proj/Linear/pre_reshape", "/layers.31/self_attn/o_proj/Linear/pre_convert", "/layers.31/self_attn/o_proj/Linear", "/layers.31/self_attn/o_proj/Linear/post_convert", "/layers.31/mlp/gate_proj/Linear/pre_reshape", "/layers.31/mlp/gate_proj/Linear/pre_convert", "/layers.31/mlp/gate_proj/Linear", "/layers.31/mlp/gate_proj/Linear/post_convert", "/layers.31/mlp/up_proj/Linear/pre_reshape", "/layers.31/mlp/up_proj/Linear/pre_convert", "/layers.31/mlp/up_proj/Linear", "/layers.31/mlp/up_proj/Linear/post_convert", "/layers.31/mlp/down_proj/Linear/pre_reshape", "/layers.31/mlp/down_proj/Linear/pre_convert", "/layers.31/mlp/down_proj/Linear", "/layers.31/mlp/down_proj/Linear/post_convert", "/layers.32/self_attn/q_proj/Linear/pre_reshape", "/layers.32/self_attn/q_proj/Linear/pre_convert", "/layers.32/self_attn/q_proj/Linear", "/layers.32/self_attn/q_proj/Linear/post_convert", "/layers.32/self_attn/k_proj/Linear/pre_reshape", "/layers.32/self_attn/k_proj/Linear/pre_convert", "/layers.32/self_attn/k_proj/Linear", "/layers.32/self_attn/k_proj/Linear/post_convert", "/layers.32/self_attn/v_proj/Linear/pre_reshape", "/layers.32/self_attn/v_proj/Linear/pre_convert", "/layers.32/self_attn/v_proj/Linear", "/layers.32/self_attn/v_proj/Linear/post_convert", "/layers.32/self_attn/o_proj/Linear/pre_reshape", "/layers.32/self_attn/o_proj/Linear/pre_convert", "/layers.32/self_attn/o_proj/Linear", "/layers.32/self_attn/o_proj/Linear/post_convert", "/layers.32/mlp/gate_proj/Linear/pre_reshape", "/layers.32/mlp/gate_proj/Linear/pre_convert", "/layers.32/mlp/gate_proj/Linear", "/layers.32/mlp/gate_proj/Linear/post_convert", "/layers.32/mlp/up_proj/Linear/pre_reshape", "/layers.32/mlp/up_proj/Linear/pre_convert", "/layers.32/mlp/up_proj/Linear", "/layers.32/mlp/up_proj/Linear/post_convert", "/layers.32/mlp/down_proj/Linear/pre_reshape", "/layers.32/mlp/down_proj/Linear/pre_convert", "/layers.32/mlp/down_proj/Linear", "/layers.32/mlp/down_proj/Linear/post_convert", "/layers.33/self_attn/q_proj/Linear/pre_reshape", "/layers.33/self_attn/q_proj/Linear/pre_convert", "/layers.33/self_attn/q_proj/Linear", "/layers.33/self_attn/q_proj/Linear/post_convert", "/layers.33/self_attn/k_proj/Linear/pre_reshape", "/layers.33/self_attn/k_proj/Linear/pre_convert", "/layers.33/self_attn/k_proj/Linear", "/layers.33/self_attn/k_proj/Linear/post_convert", "/layers.33/self_attn/v_proj/Linear/pre_reshape", "/layers.33/self_attn/v_proj/Linear/pre_convert", "/layers.33/self_attn/v_proj/Linear", "/layers.33/self_attn/v_proj/Linear/post_convert", "/layers.33/self_attn/o_proj/Linear/pre_reshape", "/layers.33/self_attn/o_proj/Linear/pre_convert", "/layers.33/self_attn/o_proj/Linear", "/layers.33/self_attn/o_proj/Linear/post_convert", "/layers.33/mlp/gate_proj/Linear/pre_reshape", "/layers.33/mlp/gate_proj/Linear/pre_convert", "/layers.33/mlp/gate_proj/Linear", "/layers.33/mlp/gate_proj/Linear/post_convert", "/layers.33/mlp/up_proj/Linear/pre_reshape", "/layers.33/mlp/up_proj/Linear/pre_convert", "/layers.33/mlp/up_proj/Linear", "/layers.33/mlp/up_proj/Linear/post_convert", "/layers.33/mlp/down_proj/Linear/pre_reshape", "/layers.33/mlp/down_proj/Linear/pre_convert", "/layers.33/mlp/down_proj/Linear", "/layers.33/mlp/down_proj/Linear/post_convert", "/layers.34/self_attn/q_proj/Linear/pre_reshape", "/layers.34/self_attn/q_proj/Linear/pre_convert", "/layers.34/self_attn/q_proj/Linear", "/layers.34/self_attn/q_proj/Linear/post_convert", "/layers.34/self_attn/k_proj/Linear/pre_reshape", "/layers.34/self_attn/k_proj/Linear/pre_convert", "/layers.34/self_attn/k_proj/Linear", "/layers.34/self_attn/k_proj/Linear/post_convert", "/layers.34/self_attn/v_proj/Linear/pre_reshape", "/layers.34/self_attn/v_proj/Linear/pre_convert", "/layers.34/self_attn/v_proj/Linear", "/layers.34/self_attn/v_proj/Linear/post_convert", "/layers.34/self_attn/o_proj/Linear/pre_reshape", "/layers.34/self_attn/o_proj/Linear/pre_convert", "/layers.34/self_attn/o_proj/Linear", "/layers.34/self_attn/o_proj/Linear/post_convert", "/layers.34/mlp/gate_proj/Linear/pre_reshape", "/layers.34/mlp/gate_proj/Linear/pre_convert", "/layers.34/mlp/gate_proj/Linear", "/layers.34/mlp/gate_proj/Linear/post_convert", "/layers.34/mlp/up_proj/Linear/pre_reshape", "/layers.34/mlp/up_proj/Linear/pre_convert", "/layers.34/mlp/up_proj/Linear", "/layers.34/mlp/up_proj/Linear/post_convert", "/layers.34/mlp/down_proj/Linear/pre_reshape", "/layers.34/mlp/down_proj/Linear/pre_convert", "/layers.34/mlp/down_proj/Linear", "/layers.34/mlp/down_proj/Linear/post_convert", "/layers.35/self_attn/q_proj/Linear/pre_reshape", "/layers.35/self_attn/q_proj/Linear/pre_convert", "/layers.35/self_attn/q_proj/Linear", "/layers.35/self_attn/q_proj/Linear/post_convert", "/layers.35/self_attn/k_proj/Linear/pre_reshape", "/layers.35/self_attn/k_proj/Linear/pre_convert", "/layers.35/self_attn/k_proj/Linear", "/layers.35/self_attn/k_proj/Linear/post_convert", "/layers.35/self_attn/v_proj/Linear/pre_reshape", "/layers.35/self_attn/v_proj/Linear/pre_convert", "/layers.35/self_attn/v_proj/Linear", "/layers.35/self_attn/v_proj/Linear/post_convert", "/layers.35/self_attn/o_proj/Linear/pre_reshape", "/layers.35/self_attn/o_proj/Linear/pre_convert", "/layers.35/self_attn/o_proj/Linear", "/layers.35/self_attn/o_proj/Linear/post_convert", "/layers.35/mlp/gate_proj/Linear/pre_reshape", "/layers.35/mlp/gate_proj/Linear/pre_convert", "/layers.35/mlp/gate_proj/Linear", "/layers.35/mlp/gate_proj/Linear/post_convert", "/layers.35/mlp/up_proj/Linear/pre_reshape", "/layers.35/mlp/up_proj/Linear/pre_convert", "/layers.35/mlp/up_proj/Linear", "/layers.35/mlp/up_proj/Linear/post_convert", "/layers.35/mlp/down_proj/Linear/pre_reshape", "/layers.35/mlp/down_proj/Linear/pre_convert", "/layers.35/mlp/down_proj/Linear", "/layers.35/mlp/down_proj/Linear/post_convert", "/lm/lm_head/Linear/pre_reshape", "/lm/lm_head/Linear/pre_convert", "/lm/lm_head/Linear", "/lm/lm_head/Linear/post_convert" ] , "tensorNumber": 0, "usage": "INFERENCE", "mnn_uuid": "7ed4cb0a-da66-443a-86c5-94b1aead96e0" }