{ "bizCode": "MNNTest", "extraInfo": { "version": "3.4.0" } , "oplists": [ { "main_type": "Input", "main": { "dims": [ 1, 1, 1024 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "input_ids", "outputIndexes": [ 2 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1, 1, -1, -1 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "attention_mask", "outputIndexes": [ 128 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1, -1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "name": "position_ids", "outputIndexes": [ 0 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "name": "logits_index", "outputIndexes": [ 1 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 3 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1, -1, 1024 ] } , "name": "/blocks.0/Constant_output_0", "outputIndexes": [ 3 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/Reshape_output_0", "outputIndexes": [ 4 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 0, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.0/input_layernorm/Mul_1_output_0", "outputIndexes": [ 5 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 5 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2653 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2653 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2654 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2654 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 8192, 1048598, 131072, 0, 0 ] } , "name": "/layers.0/self_attn/q_proj/Linear", "outputIndexes": [ 2655 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2655 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2656 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2656 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 6 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 5 ] , "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_output_0", "outputIndexes": [ 7 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 7 ] , "main_type": "NONE", "name": "Shape22", "outputIndexes": [ 8 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 7 ] , "main_type": "NONE", "name": "Rank24", "outputIndexes": [ 9 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 9, 9 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp26", "outputIndexes": [ 10 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze27", "outputIndexes": [ 11 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1 ] } , "name": "Const28", "outputIndexes": [ 12 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp29", "outputIndexes": [ 13 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 13 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze30", "outputIndexes": [ 14 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1 ] } , "name": "Unsqueeze32", "outputIndexes": [ 15 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 8, 11, 14, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice33", "outputIndexes": [ 16 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 16 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze34", "outputIndexes": [ 17 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 17, 17 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp36", "outputIndexes": [ 18 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 7, 18, 10 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_output_0", "outputIndexes": [ 19 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 0 ] } , "name": "/rotary/Constant_3_output_0", "outputIndexes": [ 20 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 19, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_output_0", "outputIndexes": [ 21 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze46", "outputIndexes": [ 22 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 13 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze49", "outputIndexes": [ 23 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 8, 22, 23, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice52", "outputIndexes": [ 24 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 24 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze53", "outputIndexes": [ 25 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 25 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp54", "outputIndexes": [ 26 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 26, 25 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp55", "outputIndexes": [ 27 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 7, 27, 10 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_1_output_0", "outputIndexes": [ 28 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 28, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 29 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 16 ] } , "name": "/blocks.0/self_attn/Constant_2_output_0", "outputIndexes": [ 30 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 128 ] } , "name": "/blocks.0/self_attn/Constant_3_output_0", "outputIndexes": [ 31 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 21, 29, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.0/self_attn/Concat_output_0", "outputIndexes": [ 32 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 6, 32 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/self_attn/Reshape_output_0", "outputIndexes": [ 33 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 33 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1187862, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.0/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 35 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 0 ] , "main_type": "CastParam", "main": { "srcT": "DT_VARIANT", "dstT": "DT_FLOAT" } , "name": "/rotary/Cast_output_0", "outputIndexes": [ 36 ] , "type": "Cast", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 2 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ -1, 1 ] } , "name": "/rotary/Constant_output_0", "outputIndexes": [ 37 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 36, 37 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/rotary/Reshape_output_0", "outputIndexes": [ 38 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 64 ] , "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": [ 1.0, 0.805842, 0.649382, 0.523299, 0.421697, 0.339821, 0.273842, 0.220673, 0.177828, 0.143301, 0.115478, 0.093057, 0.074989, 0.06043, 0.048697, 0.039242, 0.031623, 0.025483, 0.020535, 0.016548, 0.013335, 0.010746, 0.00866, 0.006978, 0.005623, 0.004532, 0.003652, 0.002943, 0.002371, 0.001911, 0.00154, 0.001241, 0.001, 0.000806, 0.000649, 0.000523, 0.000422, 0.00034, 0.000274, 0.000221, 0.000178, 0.000143, 0.000115, 0.000093, 0.000075, 0.00006, 0.000049, 0.000039, 0.000032, 0.000025, 0.000021, 0.000017, 0.000013, 0.000011, 0.000009, 0.000007, 0.000006, 0.000005, 0.000004, 0.000003, 0.000002, 0.000002, 0.000002, 0.000001 ] } , "name": "/rotary/Constant_1_output_0", "outputIndexes": [ 39 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 38, 39 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/rotary/Mul_output_0", "outputIndexes": [ 40 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 40 ] , "main_type": "UnaryOp", "main": { "opType": "COS", "T": "DT_FLOAT" } , "name": "/rotary/Cos_output_0", "outputIndexes": [ 41 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 41, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_output_0", "outputIndexes": [ 42 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 40 ] , "main_type": "UnaryOp", "main": { "opType": "SIN", "T": "DT_FLOAT" } , "name": "/rotary/Sin_output_0", "outputIndexes": [ 43 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 43, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_1_output_0", "outputIndexes": [ 44 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 42, 44 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/rotary/Concat_output_0", "outputIndexes": [ 45 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 45, 45 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/rotary/Concat_1_output_0", "outputIndexes": [ 46 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 2 ] } , "name": "/rotary/Constant_5_output_0", "outputIndexes": [ 47 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 46, 47 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_2_output_0", "outputIndexes": [ 48 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 48, 15 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_3_output_0", "outputIndexes": [ 49 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 49 ] , "main_type": "NONE", "name": "Shape85", "outputIndexes": [ 50 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 49 ] , "main_type": "NONE", "name": "Rank87", "outputIndexes": [ 51 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 51, 51 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp89", "outputIndexes": [ 52 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 52 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze90", "outputIndexes": [ 53 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 52, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp92", "outputIndexes": [ 54 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze93", "outputIndexes": [ 55 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 50, 53, 55, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice96", "outputIndexes": [ 56 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze97", "outputIndexes": [ 57 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 57, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp99", "outputIndexes": [ 58 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 49, 58, 52 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_2_output_0", "outputIndexes": [ 59 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 35, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_output_0", "outputIndexes": [ 60 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 35 ] , "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_2_output_0", "outputIndexes": [ 61 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 3 ] } , "name": "/blocks.0/self_attn/Constant_8_output_0", "outputIndexes": [ 62 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61 ] , "main_type": "NONE", "name": "Shape104", "outputIndexes": [ 63 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 61 ] , "main_type": "NONE", "name": "Rank106", "outputIndexes": [ 64 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 64, 64 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp108", "outputIndexes": [ 65 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 65 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze109", "outputIndexes": [ 66 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 65, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp111", "outputIndexes": [ 67 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 67 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze112", "outputIndexes": [ 68 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 63, 66, 68, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice115", "outputIndexes": [ 69 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 69 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze116", "outputIndexes": [ 70 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 70 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp117", "outputIndexes": [ 71 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 71, 70 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp118", "outputIndexes": [ 72 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 72, 65 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_4_output_0", "outputIndexes": [ 73 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 2 ] } , "name": "/blocks.0/self_attn/Constant_9_output_0", "outputIndexes": [ 74 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 73, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Div_output_0", "outputIndexes": [ 75 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 75, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 76 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1073741824 ] } , "name": "/blocks.0/self_attn/Constant_16_output_0", "outputIndexes": [ 77 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 3 ] } , "name": "/blocks.0/self_attn/Constant_10_output_0", "outputIndexes": [ 78 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 35, 76, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_1_output_0", "outputIndexes": [ 79 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 79 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.0/self_attn/Neg_output_0", "outputIndexes": [ 80 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 75, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 81 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 35, 20, 81, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_output_0", "outputIndexes": [ 82 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 80, 82 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.0/self_attn/Concat_3_output_0", "outputIndexes": [ 83 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 52 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze136", "outputIndexes": [ 84 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze139", "outputIndexes": [ 85 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 50, 84, 85, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice142", "outputIndexes": [ 86 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 86 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze143", "outputIndexes": [ 87 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 87 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp144", "outputIndexes": [ 88 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 88, 87 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp145", "outputIndexes": [ 89 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 49, 89, 52 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_3_output_0", "outputIndexes": [ 90 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 83, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_1_output_0", "outputIndexes": [ 91 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 91 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Add_output_0", "outputIndexes": [ 92 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2654 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1188886, 524310, 65536, 0, 0 ] } , "name": "/layers.0/self_attn/k_proj/Linear", "outputIndexes": [ 2659 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2659 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2660 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2660 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 93 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 19, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 94 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 28, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 95 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 8 ] } , "name": "/blocks.0/self_attn/Constant_4_output_0", "outputIndexes": [ 96 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 95, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.0/self_attn/Concat_1_output_0", "outputIndexes": [ 97 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 93, 97 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/self_attn/Reshape_1_output_0", "outputIndexes": [ 98 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 98 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1778732, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.0/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 100 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 100, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_2_output_0", "outputIndexes": [ 101 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 100 ] , "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_3_output_0", "outputIndexes": [ 102 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 102 ] , "main_type": "NONE", "name": "Shape166", "outputIndexes": [ 103 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 102 ] , "main_type": "NONE", "name": "Rank168", "outputIndexes": [ 104 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 104, 104 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp170", "outputIndexes": [ 105 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 105 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze171", "outputIndexes": [ 106 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 105, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp173", "outputIndexes": [ 107 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 107 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze174", "outputIndexes": [ 108 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 103, 106, 108, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice177", "outputIndexes": [ 109 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 109 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze178", "outputIndexes": [ 110 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 110 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp179", "outputIndexes": [ 111 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 111, 110 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp180", "outputIndexes": [ 112 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 102, 112, 105 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_5_output_0", "outputIndexes": [ 113 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 113, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Div_1_output_0", "outputIndexes": [ 114 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 114, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 115 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 100, 115, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_3_output_0", "outputIndexes": [ 116 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 116 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.0/self_attn/Neg_1_output_0", "outputIndexes": [ 117 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 114, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 118 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 100, 20, 118, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_2_output_0", "outputIndexes": [ 119 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 117, 119 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.0/self_attn/Concat_4_output_0", "outputIndexes": [ 120 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 120, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_3_output_0", "outputIndexes": [ 121 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 101, 121 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Add_1_output_0", "outputIndexes": [ 122 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2654 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1779756, 524310, 65536, 0, 0 ] } , "name": "/layers.0/self_attn/v_proj/Linear", "outputIndexes": [ 2663 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2663 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2664 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2664 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 123 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 19, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 124 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 28, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 125 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 124, 125, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.0/self_attn/Concat_2_output_0", "outputIndexes": [ 126 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 123, 126 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/self_attn/Reshape_2_output_0", "outputIndexes": [ 127 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 92, 122, 127, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.0/self_attn/FusedAttention", "outputIndexes": [ 129 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 129 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2665 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2665 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2666 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2666 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2369602, 1048598, 131072, 0, 0 ] } , "name": "/layers.0/self_attn/o_proj/Linear", "outputIndexes": [ 2667 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2667 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2668 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2668 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 130 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4, 130 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/Add_output_0", "outputIndexes": [ 131 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 131 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 3549272, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.0/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 132 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 132 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2669 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2669 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2670 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2670 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3557464, 1572886, 196608, 0, 0 ] } , "name": "/layers.0/mlp/gate_proj/Linear", "outputIndexes": [ 2671 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2671 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2672 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2672 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 133 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 133 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.0/mlp/act_fn/Mul_output_0", "outputIndexes": [ 134 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2670 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 5326958, 1572886, 196608, 0, 0 ] } , "name": "/layers.0/mlp/up_proj/Linear", "outputIndexes": [ 2675 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2675 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2676 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2676 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 135 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 134, 135 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/mlp/Mul_output_0", "outputIndexes": [ 136 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 136 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2677 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2677 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2678 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2678 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 7096452, 1572886, 196608, 0, 0 ] } , "name": "/layers.0/mlp/down_proj/Linear", "outputIndexes": [ 2679 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2679 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2680 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2680 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 137 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 131, 137 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/Add_1_output_0", "outputIndexes": [ 138 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 138, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/Reshape_output_0", "outputIndexes": [ 139 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 139 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 8865946, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.1/input_layernorm/Mul_1_output_0", "outputIndexes": [ 140 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 140 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2681 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2681 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2682 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2682 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 8874138, 1048598, 131072, 0, 0 ] } , "name": "/layers.1/self_attn/q_proj/Linear", "outputIndexes": [ 2683 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2683 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2684 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2684 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 141 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 140 ] , "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_output_0", "outputIndexes": [ 142 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 142 ] , "main_type": "NONE", "name": "Shape228", "outputIndexes": [ 143 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 142 ] , "main_type": "NONE", "name": "Rank230", "outputIndexes": [ 144 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 144, 144 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp232", "outputIndexes": [ 145 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 145 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze233", "outputIndexes": [ 146 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 145, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp235", "outputIndexes": [ 147 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 147 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze236", "outputIndexes": [ 148 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 143, 146, 148, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice239", "outputIndexes": [ 149 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 149 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze240", "outputIndexes": [ 150 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 150, 150 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp242", "outputIndexes": [ 151 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 142, 151, 145 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_output_0", "outputIndexes": [ 152 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 152, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_output_0", "outputIndexes": [ 153 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 145 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze250", "outputIndexes": [ 154 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 147 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze253", "outputIndexes": [ 155 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 143, 154, 155, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice256", "outputIndexes": [ 156 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 156 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze257", "outputIndexes": [ 157 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 157 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp258", "outputIndexes": [ 158 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 158, 157 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp259", "outputIndexes": [ 159 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 142, 159, 145 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_1_output_0", "outputIndexes": [ 160 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 160, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 161 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 153, 161, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.1/self_attn/Concat_output_0", "outputIndexes": [ 162 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 141, 162 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/self_attn/Reshape_output_0", "outputIndexes": [ 163 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 163 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 10053808, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.1/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 165 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 165, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_output_0", "outputIndexes": [ 166 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 165 ] , "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_2_output_0", "outputIndexes": [ 167 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 167 ] , "main_type": "NONE", "name": "Shape274", "outputIndexes": [ 168 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 167 ] , "main_type": "NONE", "name": "Rank276", "outputIndexes": [ 169 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 169, 169 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp278", "outputIndexes": [ 170 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 170 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze279", "outputIndexes": [ 171 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 170, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp281", "outputIndexes": [ 172 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 172 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze282", "outputIndexes": [ 173 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 168, 171, 173, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice285", "outputIndexes": [ 174 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 174 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze286", "outputIndexes": [ 175 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 175 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp287", "outputIndexes": [ 176 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 176, 175 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp288", "outputIndexes": [ 177 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 167, 177, 170 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_2_output_0", "outputIndexes": [ 178 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 178, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Div_output_0", "outputIndexes": [ 179 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 179, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 180 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 165, 180, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_1_output_0", "outputIndexes": [ 181 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 181 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.1/self_attn/Neg_output_0", "outputIndexes": [ 182 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 179, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 183 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 165, 20, 183, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_output_0", "outputIndexes": [ 184 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 182, 184 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.1/self_attn/Concat_3_output_0", "outputIndexes": [ 185 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 185, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_1_output_0", "outputIndexes": [ 186 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 166, 186 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Add_output_0", "outputIndexes": [ 187 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2682 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 10054832, 524310, 65536, 0, 0 ] } , "name": "/layers.1/self_attn/k_proj/Linear", "outputIndexes": [ 2687 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2687 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2688 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2688 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 188 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 152, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 189 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 160, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 190 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 189, 190, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.1/self_attn/Concat_1_output_0", "outputIndexes": [ 191 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 188, 191 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/self_attn/Reshape_1_output_0", "outputIndexes": [ 192 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 192 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 10644678, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.1/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 194 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 194, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_2_output_0", "outputIndexes": [ 195 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 194 ] , "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_3_output_0", "outputIndexes": [ 196 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 196 ] , "main_type": "NONE", "name": "Shape316", "outputIndexes": [ 197 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 196 ] , "main_type": "NONE", "name": "Rank318", "outputIndexes": [ 198 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 198, 198 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp320", "outputIndexes": [ 199 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 199 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze321", "outputIndexes": [ 200 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 199, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp323", "outputIndexes": [ 201 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 201 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze324", "outputIndexes": [ 202 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 197, 200, 202, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice327", "outputIndexes": [ 203 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 203 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze328", "outputIndexes": [ 204 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 204 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp329", "outputIndexes": [ 205 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 205, 204 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp330", "outputIndexes": [ 206 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 196, 206, 199 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_3_output_0", "outputIndexes": [ 207 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 207, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Div_1_output_0", "outputIndexes": [ 208 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 208, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 209 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 194, 209, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_3_output_0", "outputIndexes": [ 210 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 210 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.1/self_attn/Neg_1_output_0", "outputIndexes": [ 211 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 208, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 212 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 194, 20, 212, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_2_output_0", "outputIndexes": [ 213 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 211, 213 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.1/self_attn/Concat_4_output_0", "outputIndexes": [ 214 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 214, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_3_output_0", "outputIndexes": [ 215 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 195, 215 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Add_1_output_0", "outputIndexes": [ 216 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2682 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 10645702, 524310, 65536, 0, 0 ] } , "name": "/layers.1/self_attn/v_proj/Linear", "outputIndexes": [ 2691 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2691 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2692 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2692 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 217 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 152, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 218 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 160, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 219 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 218, 219, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.1/self_attn/Concat_2_output_0", "outputIndexes": [ 220 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 217, 220 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/self_attn/Reshape_2_output_0", "outputIndexes": [ 221 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 187, 216, 221, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.1/self_attn/FusedAttention", "outputIndexes": [ 222 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 222 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2693 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2693 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2694 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2694 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 11235548, 1048598, 131072, 0, 0 ] } , "name": "/layers.1/self_attn/o_proj/Linear", "outputIndexes": [ 2695 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2695 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2696 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2696 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 223 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 139, 223 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/Add_output_0", "outputIndexes": [ 224 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 224 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 12415218, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.1/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 225 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 225 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2697 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2697 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2698 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2698 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 12423410, 1572886, 196608, 0, 0 ] } , "name": "/layers.1/mlp/gate_proj/Linear", "outputIndexes": [ 2699 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2699 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2700 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2700 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 226 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 226 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.1/mlp/act_fn/Mul_output_0", "outputIndexes": [ 227 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2698 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 14192904, 1572886, 196608, 0, 0 ] } , "name": "/layers.1/mlp/up_proj/Linear", "outputIndexes": [ 2703 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2703 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2704 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2704 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 228 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 227, 228 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/mlp/Mul_output_0", "outputIndexes": [ 229 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 229 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2705 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2705 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2706 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2706 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 15962398, 1572886, 196608, 0, 0 ] } , "name": "/layers.1/mlp/down_proj/Linear", "outputIndexes": [ 2707 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2707 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2708 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2708 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 230 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 224, 230 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/Add_1_output_0", "outputIndexes": [ 231 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 231, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/Reshape_output_0", "outputIndexes": [ 232 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 232 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 17731892, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.2/input_layernorm/Mul_1_output_0", "outputIndexes": [ 233 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 233 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2709 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2709 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2710 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2710 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 17740084, 1048598, 131072, 0, 0 ] } , "name": "/layers.2/self_attn/q_proj/Linear", "outputIndexes": [ 2711 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2711 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2712 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2712 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 234 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 233 ] , "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_output_0", "outputIndexes": [ 235 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 235 ] , "main_type": "NONE", "name": "Shape377", "outputIndexes": [ 236 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 235 ] , "main_type": "NONE", "name": "Rank379", "outputIndexes": [ 237 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 237, 237 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp381", "outputIndexes": [ 238 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 238 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze382", "outputIndexes": [ 239 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 238, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp384", "outputIndexes": [ 240 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 240 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze385", "outputIndexes": [ 241 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 236, 239, 241, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice388", "outputIndexes": [ 242 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 242 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze389", "outputIndexes": [ 243 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 243, 243 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp391", "outputIndexes": [ 244 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 235, 244, 238 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_output_0", "outputIndexes": [ 245 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 245, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_output_0", "outputIndexes": [ 246 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 238 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze399", "outputIndexes": [ 247 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 240 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze402", "outputIndexes": [ 248 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 236, 247, 248, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice405", "outputIndexes": [ 249 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 249 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze406", "outputIndexes": [ 250 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 250 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp407", "outputIndexes": [ 251 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 251, 250 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp408", "outputIndexes": [ 252 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 235, 252, 238 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_1_output_0", "outputIndexes": [ 253 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 253, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 254 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 246, 254, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.2/self_attn/Concat_output_0", "outputIndexes": [ 255 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 234, 255 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/self_attn/Reshape_output_0", "outputIndexes": [ 256 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 256 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 18919754, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.2/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 258 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 258, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_output_0", "outputIndexes": [ 259 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 258 ] , "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_2_output_0", "outputIndexes": [ 260 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 260 ] , "main_type": "NONE", "name": "Shape423", "outputIndexes": [ 261 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 260 ] , "main_type": "NONE", "name": "Rank425", "outputIndexes": [ 262 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 262, 262 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp427", "outputIndexes": [ 263 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 263 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze428", "outputIndexes": [ 264 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 263, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp430", "outputIndexes": [ 265 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 265 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze431", "outputIndexes": [ 266 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 261, 264, 266, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice434", "outputIndexes": [ 267 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 267 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze435", "outputIndexes": [ 268 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 268 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp436", "outputIndexes": [ 269 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 269, 268 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp437", "outputIndexes": [ 270 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 260, 270, 263 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_2_output_0", "outputIndexes": [ 271 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 271, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Div_output_0", "outputIndexes": [ 272 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 272, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 273 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 258, 273, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_1_output_0", "outputIndexes": [ 274 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 274 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.2/self_attn/Neg_output_0", "outputIndexes": [ 275 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 272, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 276 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 258, 20, 276, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_output_0", "outputIndexes": [ 277 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 275, 277 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.2/self_attn/Concat_3_output_0", "outputIndexes": [ 278 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 278, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_1_output_0", "outputIndexes": [ 279 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 259, 279 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Add_output_0", "outputIndexes": [ 280 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2710 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 18920778, 524310, 65536, 0, 0 ] } , "name": "/layers.2/self_attn/k_proj/Linear", "outputIndexes": [ 2715 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2715 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2716 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2716 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 281 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 245, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 282 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 253, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 283 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 282, 283, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.2/self_attn/Concat_1_output_0", "outputIndexes": [ 284 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 281, 284 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/self_attn/Reshape_1_output_0", "outputIndexes": [ 285 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 285 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 19510624, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.2/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 287 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 287, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_2_output_0", "outputIndexes": [ 288 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 287 ] , "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_3_output_0", "outputIndexes": [ 289 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 289 ] , "main_type": "NONE", "name": "Shape465", "outputIndexes": [ 290 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 289 ] , "main_type": "NONE", "name": "Rank467", "outputIndexes": [ 291 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 291, 291 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp469", "outputIndexes": [ 292 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 292 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze470", "outputIndexes": [ 293 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 292, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp472", "outputIndexes": [ 294 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 294 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze473", "outputIndexes": [ 295 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 290, 293, 295, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice476", "outputIndexes": [ 296 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 296 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze477", "outputIndexes": [ 297 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 297 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp478", "outputIndexes": [ 298 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 298, 297 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp479", "outputIndexes": [ 299 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 289, 299, 292 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_3_output_0", "outputIndexes": [ 300 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 300, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Div_1_output_0", "outputIndexes": [ 301 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 301, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 302 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 287, 302, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_3_output_0", "outputIndexes": [ 303 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 303 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.2/self_attn/Neg_1_output_0", "outputIndexes": [ 304 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 301, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 305 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 287, 20, 305, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_2_output_0", "outputIndexes": [ 306 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 304, 306 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.2/self_attn/Concat_4_output_0", "outputIndexes": [ 307 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 307, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_3_output_0", "outputIndexes": [ 308 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 288, 308 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Add_1_output_0", "outputIndexes": [ 309 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2710 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 19511648, 524310, 65536, 0, 0 ] } , "name": "/layers.2/self_attn/v_proj/Linear", "outputIndexes": [ 2719 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2719 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2720 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2720 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 310 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 245, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 311 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 253, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 312 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 311, 312, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.2/self_attn/Concat_2_output_0", "outputIndexes": [ 313 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 310, 313 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/self_attn/Reshape_2_output_0", "outputIndexes": [ 314 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 280, 309, 314, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.2/self_attn/FusedAttention", "outputIndexes": [ 315 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 315 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2721 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2721 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2722 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2722 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 20101494, 1048598, 131072, 0, 0 ] } , "name": "/layers.2/self_attn/o_proj/Linear", "outputIndexes": [ 2723 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2723 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2724 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2724 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 316 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 232, 316 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/Add_output_0", "outputIndexes": [ 317 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 317 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 21281164, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.2/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 318 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 318 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2725 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2725 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2726 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2726 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 21289356, 1572886, 196608, 0, 0 ] } , "name": "/layers.2/mlp/gate_proj/Linear", "outputIndexes": [ 2727 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2727 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2728 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2728 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 319 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 319 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.2/mlp/act_fn/Mul_output_0", "outputIndexes": [ 320 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2726 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 23058850, 1572886, 196608, 0, 0 ] } , "name": "/layers.2/mlp/up_proj/Linear", "outputIndexes": [ 2731 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2731 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2732 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2732 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 321 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 320, 321 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/mlp/Mul_output_0", "outputIndexes": [ 322 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 322 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2733 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2733 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2734 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2734 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 24828344, 1572886, 196608, 0, 0 ] } , "name": "/layers.2/mlp/down_proj/Linear", "outputIndexes": [ 2735 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2735 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2736 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2736 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 323 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 317, 323 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/Add_1_output_0", "outputIndexes": [ 324 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 324, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/Reshape_output_0", "outputIndexes": [ 325 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 325 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 26597838, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.3/input_layernorm/Mul_1_output_0", "outputIndexes": [ 326 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 326 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2737 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2737 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2738 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2738 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 26606030, 1048598, 131072, 0, 0 ] } , "name": "/layers.3/self_attn/q_proj/Linear", "outputIndexes": [ 2739 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2739 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2740 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2740 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 327 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 326 ] , "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_output_0", "outputIndexes": [ 328 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 328 ] , "main_type": "NONE", "name": "Shape526", "outputIndexes": [ 329 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 328 ] , "main_type": "NONE", "name": "Rank528", "outputIndexes": [ 330 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 330, 330 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp530", "outputIndexes": [ 331 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 331 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze531", "outputIndexes": [ 332 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 331, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp533", "outputIndexes": [ 333 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 333 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze534", "outputIndexes": [ 334 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 329, 332, 334, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice537", "outputIndexes": [ 335 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 335 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze538", "outputIndexes": [ 336 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 336, 336 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp540", "outputIndexes": [ 337 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 328, 337, 331 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_output_0", "outputIndexes": [ 338 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 338, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_output_0", "outputIndexes": [ 339 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 331 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze548", "outputIndexes": [ 340 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 333 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze551", "outputIndexes": [ 341 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 329, 340, 341, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice554", "outputIndexes": [ 342 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 342 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze555", "outputIndexes": [ 343 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 343 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp556", "outputIndexes": [ 344 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 344, 343 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp557", "outputIndexes": [ 345 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 328, 345, 331 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_1_output_0", "outputIndexes": [ 346 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 346, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 347 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 339, 347, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.3/self_attn/Concat_output_0", "outputIndexes": [ 348 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 327, 348 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/self_attn/Reshape_output_0", "outputIndexes": [ 349 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 349 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 27785700, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.3/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 351 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 351, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_output_0", "outputIndexes": [ 352 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 351 ] , "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_2_output_0", "outputIndexes": [ 353 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 353 ] , "main_type": "NONE", "name": "Shape572", "outputIndexes": [ 354 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 353 ] , "main_type": "NONE", "name": "Rank574", "outputIndexes": [ 355 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 355, 355 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp576", "outputIndexes": [ 356 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 356 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze577", "outputIndexes": [ 357 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 356, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp579", "outputIndexes": [ 358 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 358 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze580", "outputIndexes": [ 359 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 354, 357, 359, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice583", "outputIndexes": [ 360 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 360 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze584", "outputIndexes": [ 361 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 361 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp585", "outputIndexes": [ 362 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 362, 361 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp586", "outputIndexes": [ 363 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 353, 363, 356 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_2_output_0", "outputIndexes": [ 364 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 364, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Div_output_0", "outputIndexes": [ 365 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 365, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 366 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 351, 366, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_1_output_0", "outputIndexes": [ 367 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 367 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.3/self_attn/Neg_output_0", "outputIndexes": [ 368 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 365, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 369 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 351, 20, 369, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_output_0", "outputIndexes": [ 370 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 368, 370 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.3/self_attn/Concat_3_output_0", "outputIndexes": [ 371 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 371, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_1_output_0", "outputIndexes": [ 372 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 352, 372 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Add_output_0", "outputIndexes": [ 373 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2738 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 27786724, 524310, 65536, 0, 0 ] } , "name": "/layers.3/self_attn/k_proj/Linear", "outputIndexes": [ 2743 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2743 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2744 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2744 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 374 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 338, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 375 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 346, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 376 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 375, 376, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.3/self_attn/Concat_1_output_0", "outputIndexes": [ 377 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 374, 377 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/self_attn/Reshape_1_output_0", "outputIndexes": [ 378 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 378 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 28376570, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.3/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 380 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 380, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_2_output_0", "outputIndexes": [ 381 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 380 ] , "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_3_output_0", "outputIndexes": [ 382 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 382 ] , "main_type": "NONE", "name": "Shape614", "outputIndexes": [ 383 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 382 ] , "main_type": "NONE", "name": "Rank616", "outputIndexes": [ 384 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 384, 384 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp618", "outputIndexes": [ 385 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 385 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze619", "outputIndexes": [ 386 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 385, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp621", "outputIndexes": [ 387 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 387 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze622", "outputIndexes": [ 388 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 383, 386, 388, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice625", "outputIndexes": [ 389 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 389 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze626", "outputIndexes": [ 390 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 390 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp627", "outputIndexes": [ 391 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 391, 390 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp628", "outputIndexes": [ 392 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 382, 392, 385 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_3_output_0", "outputIndexes": [ 393 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 393, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Div_1_output_0", "outputIndexes": [ 394 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 394, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 395 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 380, 395, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_3_output_0", "outputIndexes": [ 396 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 396 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.3/self_attn/Neg_1_output_0", "outputIndexes": [ 397 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 394, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 398 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 380, 20, 398, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_2_output_0", "outputIndexes": [ 399 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 397, 399 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.3/self_attn/Concat_4_output_0", "outputIndexes": [ 400 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 400, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_3_output_0", "outputIndexes": [ 401 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 381, 401 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Add_1_output_0", "outputIndexes": [ 402 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2738 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 28377594, 524310, 65536, 0, 0 ] } , "name": "/layers.3/self_attn/v_proj/Linear", "outputIndexes": [ 2747 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2747 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2748 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2748 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 403 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 338, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 404 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 346, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 405 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 404, 405, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.3/self_attn/Concat_2_output_0", "outputIndexes": [ 406 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 403, 406 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/self_attn/Reshape_2_output_0", "outputIndexes": [ 407 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 373, 402, 407, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.3/self_attn/FusedAttention", "outputIndexes": [ 408 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 408 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2749 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2749 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2750 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2750 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 28967440, 1048598, 131072, 0, 0 ] } , "name": "/layers.3/self_attn/o_proj/Linear", "outputIndexes": [ 2751 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2751 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2752 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2752 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 409 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 325, 409 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/Add_output_0", "outputIndexes": [ 410 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 30147110, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.3/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 411 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 411 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2753 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2753 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2754 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2754 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 30155302, 1572886, 196608, 0, 0 ] } , "name": "/layers.3/mlp/gate_proj/Linear", "outputIndexes": [ 2755 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2755 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2756 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2756 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 412 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 412 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.3/mlp/act_fn/Mul_output_0", "outputIndexes": [ 413 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2754 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 31924796, 1572886, 196608, 0, 0 ] } , "name": "/layers.3/mlp/up_proj/Linear", "outputIndexes": [ 2759 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2759 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2760 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2760 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 414 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 413, 414 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/mlp/Mul_output_0", "outputIndexes": [ 415 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 415 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2761 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2761 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2762 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2762 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 33694290, 1572886, 196608, 0, 0 ] } , "name": "/layers.3/mlp/down_proj/Linear", "outputIndexes": [ 2763 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2763 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2764 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2764 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 416 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410, 416 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/Add_1_output_0", "outputIndexes": [ 417 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 417, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/Reshape_output_0", "outputIndexes": [ 418 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 418 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 35463784, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.4/input_layernorm/Mul_1_output_0", "outputIndexes": [ 419 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 419 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2765 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2765 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2766 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2766 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 35471976, 1048598, 131072, 0, 0 ] } , "name": "/layers.4/self_attn/q_proj/Linear", "outputIndexes": [ 2767 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2767 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2768 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2768 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 420 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 419 ] , "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_output_0", "outputIndexes": [ 421 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 421 ] , "main_type": "NONE", "name": "Shape675", "outputIndexes": [ 422 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 421 ] , "main_type": "NONE", "name": "Rank677", "outputIndexes": [ 423 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 423, 423 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp679", "outputIndexes": [ 424 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 424 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze680", "outputIndexes": [ 425 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 424, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp682", "outputIndexes": [ 426 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 426 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze683", "outputIndexes": [ 427 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 422, 425, 427, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice686", "outputIndexes": [ 428 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 428 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze687", "outputIndexes": [ 429 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 429, 429 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp689", "outputIndexes": [ 430 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 421, 430, 424 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_output_0", "outputIndexes": [ 431 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 431, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_output_0", "outputIndexes": [ 432 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 424 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze697", "outputIndexes": [ 433 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 426 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze700", "outputIndexes": [ 434 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 422, 433, 434, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice703", "outputIndexes": [ 435 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 435 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze704", "outputIndexes": [ 436 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 436 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp705", "outputIndexes": [ 437 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 437, 436 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp706", "outputIndexes": [ 438 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 421, 438, 424 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_1_output_0", "outputIndexes": [ 439 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 439, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 440 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 432, 440, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.4/self_attn/Concat_output_0", "outputIndexes": [ 441 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 420, 441 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/self_attn/Reshape_output_0", "outputIndexes": [ 442 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 442 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 36651646, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.4/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 444 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 444, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_output_0", "outputIndexes": [ 445 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 444 ] , "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_2_output_0", "outputIndexes": [ 446 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 446 ] , "main_type": "NONE", "name": "Shape721", "outputIndexes": [ 447 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 446 ] , "main_type": "NONE", "name": "Rank723", "outputIndexes": [ 448 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 448, 448 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp725", "outputIndexes": [ 449 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 449 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze726", "outputIndexes": [ 450 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 449, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp728", "outputIndexes": [ 451 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 451 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze729", "outputIndexes": [ 452 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 447, 450, 452, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice732", "outputIndexes": [ 453 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 453 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze733", "outputIndexes": [ 454 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 454 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp734", "outputIndexes": [ 455 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 455, 454 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp735", "outputIndexes": [ 456 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 446, 456, 449 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_2_output_0", "outputIndexes": [ 457 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 457, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Div_output_0", "outputIndexes": [ 458 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 458, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 459 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 444, 459, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_1_output_0", "outputIndexes": [ 460 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 460 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.4/self_attn/Neg_output_0", "outputIndexes": [ 461 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 458, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 462 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 444, 20, 462, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_output_0", "outputIndexes": [ 463 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 461, 463 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.4/self_attn/Concat_3_output_0", "outputIndexes": [ 464 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 464, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_1_output_0", "outputIndexes": [ 465 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 445, 465 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Add_output_0", "outputIndexes": [ 466 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2766 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 36652670, 524310, 65536, 0, 0 ] } , "name": "/layers.4/self_attn/k_proj/Linear", "outputIndexes": [ 2771 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2771 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2772 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2772 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 467 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 431, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 468 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 439, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 469 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 468, 469, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.4/self_attn/Concat_1_output_0", "outputIndexes": [ 470 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 467, 470 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/self_attn/Reshape_1_output_0", "outputIndexes": [ 471 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 471 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 37242516, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.4/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 473 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 473, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_2_output_0", "outputIndexes": [ 474 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 473 ] , "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_3_output_0", "outputIndexes": [ 475 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 475 ] , "main_type": "NONE", "name": "Shape763", "outputIndexes": [ 476 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 475 ] , "main_type": "NONE", "name": "Rank765", "outputIndexes": [ 477 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 477, 477 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp767", "outputIndexes": [ 478 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 478 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze768", "outputIndexes": [ 479 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 478, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp770", "outputIndexes": [ 480 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 480 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze771", "outputIndexes": [ 481 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 476, 479, 481, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice774", "outputIndexes": [ 482 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 482 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze775", "outputIndexes": [ 483 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 483 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp776", "outputIndexes": [ 484 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 484, 483 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp777", "outputIndexes": [ 485 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 475, 485, 478 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_3_output_0", "outputIndexes": [ 486 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 486, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Div_1_output_0", "outputIndexes": [ 487 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 487, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 488 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 473, 488, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_3_output_0", "outputIndexes": [ 489 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 489 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.4/self_attn/Neg_1_output_0", "outputIndexes": [ 490 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 487, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 491 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 473, 20, 491, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_2_output_0", "outputIndexes": [ 492 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 490, 492 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.4/self_attn/Concat_4_output_0", "outputIndexes": [ 493 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 493, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_3_output_0", "outputIndexes": [ 494 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 474, 494 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Add_1_output_0", "outputIndexes": [ 495 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2766 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 37243540, 524310, 65536, 0, 0 ] } , "name": "/layers.4/self_attn/v_proj/Linear", "outputIndexes": [ 2775 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2775 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2776 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2776 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 496 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 431, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 497 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 439, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 498 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 497, 498, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.4/self_attn/Concat_2_output_0", "outputIndexes": [ 499 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 496, 499 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/self_attn/Reshape_2_output_0", "outputIndexes": [ 500 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 466, 495, 500, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.4/self_attn/FusedAttention", "outputIndexes": [ 501 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 501 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2777 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2777 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2778 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2778 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 37833386, 1048598, 131072, 0, 0 ] } , "name": "/layers.4/self_attn/o_proj/Linear", "outputIndexes": [ 2779 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2779 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2780 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2780 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 502 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 418, 502 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/Add_output_0", "outputIndexes": [ 503 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 503 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 39013056, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.4/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 504 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 504 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2781 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2781 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2782 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2782 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 39021248, 1572886, 196608, 0, 0 ] } , "name": "/layers.4/mlp/gate_proj/Linear", "outputIndexes": [ 2783 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2783 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2784 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2784 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 505 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 505 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.4/mlp/act_fn/Mul_output_0", "outputIndexes": [ 506 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2782 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 40790742, 1572886, 196608, 0, 0 ] } , "name": "/layers.4/mlp/up_proj/Linear", "outputIndexes": [ 2787 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2787 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2788 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2788 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 507 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 506, 507 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/mlp/Mul_output_0", "outputIndexes": [ 508 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 508 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2789 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2789 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2790 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2790 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 42560236, 1572886, 196608, 0, 0 ] } , "name": "/layers.4/mlp/down_proj/Linear", "outputIndexes": [ 2791 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2791 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2792 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2792 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 509 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 503, 509 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/Add_1_output_0", "outputIndexes": [ 510 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 510, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/Reshape_output_0", "outputIndexes": [ 511 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 511 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 44329730, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.5/input_layernorm/Mul_1_output_0", "outputIndexes": [ 512 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 512 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2793 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2793 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2794 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2794 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 44337922, 1048598, 131072, 0, 0 ] } , "name": "/layers.5/self_attn/q_proj/Linear", "outputIndexes": [ 2795 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2795 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2796 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2796 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 513 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 512 ] , "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_output_0", "outputIndexes": [ 514 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 514 ] , "main_type": "NONE", "name": "Shape824", "outputIndexes": [ 515 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 514 ] , "main_type": "NONE", "name": "Rank826", "outputIndexes": [ 516 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 516, 516 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp828", "outputIndexes": [ 517 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 517 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze829", "outputIndexes": [ 518 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 517, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp831", "outputIndexes": [ 519 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 519 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze832", "outputIndexes": [ 520 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 515, 518, 520, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice835", "outputIndexes": [ 521 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 521 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze836", "outputIndexes": [ 522 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 522, 522 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp838", "outputIndexes": [ 523 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 514, 523, 517 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_output_0", "outputIndexes": [ 524 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 524, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_output_0", "outputIndexes": [ 525 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 517 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze846", "outputIndexes": [ 526 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 519 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze849", "outputIndexes": [ 527 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 515, 526, 527, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice852", "outputIndexes": [ 528 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 528 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze853", "outputIndexes": [ 529 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 529 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp854", "outputIndexes": [ 530 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 530, 529 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp855", "outputIndexes": [ 531 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 514, 531, 517 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_1_output_0", "outputIndexes": [ 532 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 532, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 533 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 525, 533, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.5/self_attn/Concat_output_0", "outputIndexes": [ 534 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 513, 534 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/self_attn/Reshape_output_0", "outputIndexes": [ 535 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 535 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 45517592, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.5/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 537 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 537, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_output_0", "outputIndexes": [ 538 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 537 ] , "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_2_output_0", "outputIndexes": [ 539 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 539 ] , "main_type": "NONE", "name": "Shape870", "outputIndexes": [ 540 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 539 ] , "main_type": "NONE", "name": "Rank872", "outputIndexes": [ 541 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 541, 541 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp874", "outputIndexes": [ 542 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 542 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze875", "outputIndexes": [ 543 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 542, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp877", "outputIndexes": [ 544 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 544 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze878", "outputIndexes": [ 545 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 540, 543, 545, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice881", "outputIndexes": [ 546 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 546 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze882", "outputIndexes": [ 547 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 547 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp883", "outputIndexes": [ 548 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 548, 547 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp884", "outputIndexes": [ 549 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 539, 549, 542 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_2_output_0", "outputIndexes": [ 550 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 550, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Div_output_0", "outputIndexes": [ 551 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 551, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 552 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 537, 552, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_1_output_0", "outputIndexes": [ 553 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 553 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.5/self_attn/Neg_output_0", "outputIndexes": [ 554 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 551, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 555 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 537, 20, 555, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_output_0", "outputIndexes": [ 556 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 554, 556 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.5/self_attn/Concat_3_output_0", "outputIndexes": [ 557 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 557, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_1_output_0", "outputIndexes": [ 558 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 538, 558 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Add_output_0", "outputIndexes": [ 559 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2794 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 45518616, 524310, 65536, 0, 0 ] } , "name": "/layers.5/self_attn/k_proj/Linear", "outputIndexes": [ 2799 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2799 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2800 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2800 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 560 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 524, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 561 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 532, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 562 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 561, 562, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.5/self_attn/Concat_1_output_0", "outputIndexes": [ 563 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 560, 563 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/self_attn/Reshape_1_output_0", "outputIndexes": [ 564 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 564 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 46108462, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.5/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 566 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 566, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_2_output_0", "outputIndexes": [ 567 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 566 ] , "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_3_output_0", "outputIndexes": [ 568 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 568 ] , "main_type": "NONE", "name": "Shape912", "outputIndexes": [ 569 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 568 ] , "main_type": "NONE", "name": "Rank914", "outputIndexes": [ 570 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 570, 570 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp916", "outputIndexes": [ 571 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 571 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze917", "outputIndexes": [ 572 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 571, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp919", "outputIndexes": [ 573 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 573 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze920", "outputIndexes": [ 574 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 569, 572, 574, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice923", "outputIndexes": [ 575 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 575 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze924", "outputIndexes": [ 576 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 576 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp925", "outputIndexes": [ 577 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 577, 576 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp926", "outputIndexes": [ 578 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 568, 578, 571 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_3_output_0", "outputIndexes": [ 579 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 579, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Div_1_output_0", "outputIndexes": [ 580 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 580, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 581 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 566, 581, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_3_output_0", "outputIndexes": [ 582 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 582 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.5/self_attn/Neg_1_output_0", "outputIndexes": [ 583 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 580, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 584 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 566, 20, 584, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_2_output_0", "outputIndexes": [ 585 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 583, 585 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.5/self_attn/Concat_4_output_0", "outputIndexes": [ 586 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 586, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_3_output_0", "outputIndexes": [ 587 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 567, 587 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Add_1_output_0", "outputIndexes": [ 588 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2794 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 46109486, 524310, 65536, 0, 0 ] } , "name": "/layers.5/self_attn/v_proj/Linear", "outputIndexes": [ 2803 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2803 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2804 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2804 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 589 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 524, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 590 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 532, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 591 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 590, 591, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.5/self_attn/Concat_2_output_0", "outputIndexes": [ 592 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 589, 592 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/self_attn/Reshape_2_output_0", "outputIndexes": [ 593 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 559, 588, 593, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.5/self_attn/FusedAttention", "outputIndexes": [ 594 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 594 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2805 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2805 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2806 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2806 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 46699332, 1048598, 131072, 0, 0 ] } , "name": "/layers.5/self_attn/o_proj/Linear", "outputIndexes": [ 2807 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2807 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2808 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2808 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 595 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 511, 595 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/Add_output_0", "outputIndexes": [ 596 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 596 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 47879002, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.5/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 597 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 597 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2809 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2809 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2810 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2810 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 47887194, 1572886, 196608, 0, 0 ] } , "name": "/layers.5/mlp/gate_proj/Linear", "outputIndexes": [ 2811 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2811 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2812 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2812 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 598 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 598 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.5/mlp/act_fn/Mul_output_0", "outputIndexes": [ 599 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2810 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 49656688, 1572886, 196608, 0, 0 ] } , "name": "/layers.5/mlp/up_proj/Linear", "outputIndexes": [ 2815 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2815 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2816 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2816 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 600 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 599, 600 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/mlp/Mul_output_0", "outputIndexes": [ 601 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 601 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2817 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2817 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2818 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2818 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 51426182, 1572886, 196608, 0, 0 ] } , "name": "/layers.5/mlp/down_proj/Linear", "outputIndexes": [ 2819 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2819 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2820 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2820 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 602 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 596, 602 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/Add_1_output_0", "outputIndexes": [ 603 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 603, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/Reshape_output_0", "outputIndexes": [ 604 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 604 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 53195676, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.6/input_layernorm/Mul_1_output_0", "outputIndexes": [ 605 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 605 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2821 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2821 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2822 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2822 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 53203868, 1048598, 131072, 0, 0 ] } , "name": "/layers.6/self_attn/q_proj/Linear", "outputIndexes": [ 2823 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2823 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2824 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2824 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 606 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 605 ] , "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_output_0", "outputIndexes": [ 607 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 607 ] , "main_type": "NONE", "name": "Shape973", "outputIndexes": [ 608 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 607 ] , "main_type": "NONE", "name": "Rank975", "outputIndexes": [ 609 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 609, 609 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp977", "outputIndexes": [ 610 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 610 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze978", "outputIndexes": [ 611 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 610, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp980", "outputIndexes": [ 612 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 612 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze981", "outputIndexes": [ 613 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 608, 611, 613, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice984", "outputIndexes": [ 614 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 614 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze985", "outputIndexes": [ 615 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 615, 615 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp987", "outputIndexes": [ 616 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 607, 616, 610 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_output_0", "outputIndexes": [ 617 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 617, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_output_0", "outputIndexes": [ 618 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 610 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze995", "outputIndexes": [ 619 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 612 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze998", "outputIndexes": [ 620 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 608, 619, 620, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1001", "outputIndexes": [ 621 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 621 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1002", "outputIndexes": [ 622 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 622 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1003", "outputIndexes": [ 623 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 623, 622 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1004", "outputIndexes": [ 624 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 607, 624, 610 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_1_output_0", "outputIndexes": [ 625 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 625, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 626 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 618, 626, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.6/self_attn/Concat_output_0", "outputIndexes": [ 627 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 606, 627 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/self_attn/Reshape_output_0", "outputIndexes": [ 628 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 628 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 54383538, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.6/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 630 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 630, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_output_0", "outputIndexes": [ 631 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 630 ] , "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_2_output_0", "outputIndexes": [ 632 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 632 ] , "main_type": "NONE", "name": "Shape1019", "outputIndexes": [ 633 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 632 ] , "main_type": "NONE", "name": "Rank1021", "outputIndexes": [ 634 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 634, 634 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1023", "outputIndexes": [ 635 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 635 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1024", "outputIndexes": [ 636 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 635, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1026", "outputIndexes": [ 637 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 637 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1027", "outputIndexes": [ 638 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 633, 636, 638, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1030", "outputIndexes": [ 639 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 639 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1031", "outputIndexes": [ 640 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 640 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1032", "outputIndexes": [ 641 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 641, 640 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1033", "outputIndexes": [ 642 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 632, 642, 635 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_2_output_0", "outputIndexes": [ 643 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 643, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Div_output_0", "outputIndexes": [ 644 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 644, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 645 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 630, 645, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_1_output_0", "outputIndexes": [ 646 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 646 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.6/self_attn/Neg_output_0", "outputIndexes": [ 647 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 644, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 648 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 630, 20, 648, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_output_0", "outputIndexes": [ 649 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 647, 649 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.6/self_attn/Concat_3_output_0", "outputIndexes": [ 650 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 650, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_1_output_0", "outputIndexes": [ 651 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 631, 651 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Add_output_0", "outputIndexes": [ 652 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2822 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 54384562, 524310, 65536, 0, 0 ] } , "name": "/layers.6/self_attn/k_proj/Linear", "outputIndexes": [ 2827 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2827 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2828 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2828 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 653 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 617, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 654 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 625, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 655 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 654, 655, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.6/self_attn/Concat_1_output_0", "outputIndexes": [ 656 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 653, 656 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/self_attn/Reshape_1_output_0", "outputIndexes": [ 657 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 657 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 54974408, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.6/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 659 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 659, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_2_output_0", "outputIndexes": [ 660 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 659 ] , "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_3_output_0", "outputIndexes": [ 661 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 661 ] , "main_type": "NONE", "name": "Shape1061", "outputIndexes": [ 662 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 661 ] , "main_type": "NONE", "name": "Rank1063", "outputIndexes": [ 663 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 663, 663 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1065", "outputIndexes": [ 664 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 664 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1066", "outputIndexes": [ 665 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 664, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1068", "outputIndexes": [ 666 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 666 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1069", "outputIndexes": [ 667 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 662, 665, 667, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1072", "outputIndexes": [ 668 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 668 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1073", "outputIndexes": [ 669 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 669 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1074", "outputIndexes": [ 670 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 670, 669 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1075", "outputIndexes": [ 671 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 661, 671, 664 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_3_output_0", "outputIndexes": [ 672 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 672, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Div_1_output_0", "outputIndexes": [ 673 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 673, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 674 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 659, 674, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_3_output_0", "outputIndexes": [ 675 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 675 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.6/self_attn/Neg_1_output_0", "outputIndexes": [ 676 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 673, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 677 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 659, 20, 677, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_2_output_0", "outputIndexes": [ 678 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 676, 678 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.6/self_attn/Concat_4_output_0", "outputIndexes": [ 679 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 679, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_3_output_0", "outputIndexes": [ 680 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 660, 680 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Add_1_output_0", "outputIndexes": [ 681 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2822 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 54975432, 524310, 65536, 0, 0 ] } , "name": "/layers.6/self_attn/v_proj/Linear", "outputIndexes": [ 2831 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2831 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2832 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2832 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 682 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 617, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 683 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 625, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 684 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 683, 684, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.6/self_attn/Concat_2_output_0", "outputIndexes": [ 685 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 682, 685 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/self_attn/Reshape_2_output_0", "outputIndexes": [ 686 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 652, 681, 686, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.6/self_attn/FusedAttention", "outputIndexes": [ 687 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 687 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2833 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2833 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2834 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2834 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 55565278, 1048598, 131072, 0, 0 ] } , "name": "/layers.6/self_attn/o_proj/Linear", "outputIndexes": [ 2835 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2835 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2836 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2836 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 688 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 604, 688 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/Add_output_0", "outputIndexes": [ 689 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 689 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 56744948, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.6/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 690 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 690 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2837 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2837 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2838 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2838 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 56753140, 1572886, 196608, 0, 0 ] } , "name": "/layers.6/mlp/gate_proj/Linear", "outputIndexes": [ 2839 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2839 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2840 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2840 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 691 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 691 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.6/mlp/act_fn/Mul_output_0", "outputIndexes": [ 692 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2838 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 58522634, 1572886, 196608, 0, 0 ] } , "name": "/layers.6/mlp/up_proj/Linear", "outputIndexes": [ 2843 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2843 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2844 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2844 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 693 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 692, 693 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/mlp/Mul_output_0", "outputIndexes": [ 694 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 694 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2845 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2845 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2846 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2846 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 60292128, 1572886, 196608, 0, 0 ] } , "name": "/layers.6/mlp/down_proj/Linear", "outputIndexes": [ 2847 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2847 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2848 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2848 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 695 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 689, 695 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/Add_1_output_0", "outputIndexes": [ 696 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 696, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/Reshape_output_0", "outputIndexes": [ 697 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 697 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 62061622, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.7/input_layernorm/Mul_1_output_0", "outputIndexes": [ 698 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 698 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2849 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2849 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2850 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2850 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 62069814, 1048598, 131072, 0, 0 ] } , "name": "/layers.7/self_attn/q_proj/Linear", "outputIndexes": [ 2851 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2851 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2852 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2852 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 699 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 698 ] , "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_output_0", "outputIndexes": [ 700 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 700 ] , "main_type": "NONE", "name": "Shape1122", "outputIndexes": [ 701 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 700 ] , "main_type": "NONE", "name": "Rank1124", "outputIndexes": [ 702 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 702, 702 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1126", "outputIndexes": [ 703 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 703 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1127", "outputIndexes": [ 704 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 703, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1129", "outputIndexes": [ 705 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 705 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1130", "outputIndexes": [ 706 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 701, 704, 706, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1133", "outputIndexes": [ 707 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 707 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1134", "outputIndexes": [ 708 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 708, 708 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1136", "outputIndexes": [ 709 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 700, 709, 703 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_output_0", "outputIndexes": [ 710 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 710, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_output_0", "outputIndexes": [ 711 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 703 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1144", "outputIndexes": [ 712 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 705 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1147", "outputIndexes": [ 713 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 701, 712, 713, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1150", "outputIndexes": [ 714 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 714 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1151", "outputIndexes": [ 715 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 715 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1152", "outputIndexes": [ 716 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 716, 715 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1153", "outputIndexes": [ 717 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 700, 717, 703 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_1_output_0", "outputIndexes": [ 718 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 718, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 719 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 711, 719, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.7/self_attn/Concat_output_0", "outputIndexes": [ 720 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 699, 720 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/self_attn/Reshape_output_0", "outputIndexes": [ 721 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 721 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 63249484, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.7/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 723 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 723, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_output_0", "outputIndexes": [ 724 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 723 ] , "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_2_output_0", "outputIndexes": [ 725 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 725 ] , "main_type": "NONE", "name": "Shape1168", "outputIndexes": [ 726 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 725 ] , "main_type": "NONE", "name": "Rank1170", "outputIndexes": [ 727 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 727, 727 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1172", "outputIndexes": [ 728 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 728 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1173", "outputIndexes": [ 729 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 728, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1175", "outputIndexes": [ 730 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 730 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1176", "outputIndexes": [ 731 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 726, 729, 731, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1179", "outputIndexes": [ 732 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 732 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1180", "outputIndexes": [ 733 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 733 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1181", "outputIndexes": [ 734 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 734, 733 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1182", "outputIndexes": [ 735 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 725, 735, 728 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_2_output_0", "outputIndexes": [ 736 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 736, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Div_output_0", "outputIndexes": [ 737 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 737, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 738 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 723, 738, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_1_output_0", "outputIndexes": [ 739 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 739 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.7/self_attn/Neg_output_0", "outputIndexes": [ 740 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 737, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 741 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 723, 20, 741, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_output_0", "outputIndexes": [ 742 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 740, 742 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.7/self_attn/Concat_3_output_0", "outputIndexes": [ 743 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 743, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_1_output_0", "outputIndexes": [ 744 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 724, 744 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Add_output_0", "outputIndexes": [ 745 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2850 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 63250508, 524310, 65536, 0, 0 ] } , "name": "/layers.7/self_attn/k_proj/Linear", "outputIndexes": [ 2855 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2855 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2856 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2856 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 746 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 710, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 747 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 718, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 748 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 747, 748, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.7/self_attn/Concat_1_output_0", "outputIndexes": [ 749 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 746, 749 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/self_attn/Reshape_1_output_0", "outputIndexes": [ 750 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 750 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 63840354, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.7/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 752 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 752, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_2_output_0", "outputIndexes": [ 753 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 752 ] , "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_3_output_0", "outputIndexes": [ 754 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 754 ] , "main_type": "NONE", "name": "Shape1210", "outputIndexes": [ 755 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 754 ] , "main_type": "NONE", "name": "Rank1212", "outputIndexes": [ 756 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 756, 756 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1214", "outputIndexes": [ 757 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 757 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1215", "outputIndexes": [ 758 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 757, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1217", "outputIndexes": [ 759 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 759 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1218", "outputIndexes": [ 760 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 755, 758, 760, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1221", "outputIndexes": [ 761 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 761 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1222", "outputIndexes": [ 762 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 762 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1223", "outputIndexes": [ 763 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 763, 762 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1224", "outputIndexes": [ 764 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 754, 764, 757 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_3_output_0", "outputIndexes": [ 765 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 765, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Div_1_output_0", "outputIndexes": [ 766 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 766, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 767 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 752, 767, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_3_output_0", "outputIndexes": [ 768 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 768 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.7/self_attn/Neg_1_output_0", "outputIndexes": [ 769 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 766, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 770 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 752, 20, 770, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_2_output_0", "outputIndexes": [ 771 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 769, 771 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.7/self_attn/Concat_4_output_0", "outputIndexes": [ 772 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 772, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_3_output_0", "outputIndexes": [ 773 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 753, 773 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Add_1_output_0", "outputIndexes": [ 774 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2850 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 63841378, 524310, 65536, 0, 0 ] } , "name": "/layers.7/self_attn/v_proj/Linear", "outputIndexes": [ 2859 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2859 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2860 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2860 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 775 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 710, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 776 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 718, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 777 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 776, 777, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.7/self_attn/Concat_2_output_0", "outputIndexes": [ 778 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 775, 778 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/self_attn/Reshape_2_output_0", "outputIndexes": [ 779 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 745, 774, 779, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.7/self_attn/FusedAttention", "outputIndexes": [ 780 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 780 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2861 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2861 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2862 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2862 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 64431224, 1048598, 131072, 0, 0 ] } , "name": "/layers.7/self_attn/o_proj/Linear", "outputIndexes": [ 2863 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2863 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2864 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2864 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 781 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 697, 781 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/Add_output_0", "outputIndexes": [ 782 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 65610894, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.7/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 783 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 783 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2865 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2865 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2866 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2866 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 65619086, 1572886, 196608, 0, 0 ] } , "name": "/layers.7/mlp/gate_proj/Linear", "outputIndexes": [ 2867 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2867 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2868 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2868 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 784 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 784 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.7/mlp/act_fn/Mul_output_0", "outputIndexes": [ 785 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2866 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 67388580, 1572886, 196608, 0, 0 ] } , "name": "/layers.7/mlp/up_proj/Linear", "outputIndexes": [ 2871 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2871 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2872 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2872 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 786 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 785, 786 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/mlp/Mul_output_0", "outputIndexes": [ 787 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 787 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2873 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2873 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2874 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2874 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 69158074, 1572886, 196608, 0, 0 ] } , "name": "/layers.7/mlp/down_proj/Linear", "outputIndexes": [ 2875 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2875 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2876 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2876 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 788 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782, 788 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/Add_1_output_0", "outputIndexes": [ 789 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 789, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/Reshape_output_0", "outputIndexes": [ 790 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 790 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 70927568, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.8/input_layernorm/Mul_1_output_0", "outputIndexes": [ 791 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 791 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2877 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2877 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2878 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2878 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 70935760, 1048598, 131072, 0, 0 ] } , "name": "/layers.8/self_attn/q_proj/Linear", "outputIndexes": [ 2879 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2879 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2880 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2880 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 792 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 791 ] , "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_output_0", "outputIndexes": [ 793 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 793 ] , "main_type": "NONE", "name": "Shape1271", "outputIndexes": [ 794 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 793 ] , "main_type": "NONE", "name": "Rank1273", "outputIndexes": [ 795 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 795, 795 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1275", "outputIndexes": [ 796 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 796 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1276", "outputIndexes": [ 797 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 796, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1278", "outputIndexes": [ 798 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 798 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1279", "outputIndexes": [ 799 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 794, 797, 799, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1282", "outputIndexes": [ 800 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 800 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1283", "outputIndexes": [ 801 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 801, 801 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1285", "outputIndexes": [ 802 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 793, 802, 796 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_output_0", "outputIndexes": [ 803 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 803, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_output_0", "outputIndexes": [ 804 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 796 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1293", "outputIndexes": [ 805 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 798 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1296", "outputIndexes": [ 806 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 794, 805, 806, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1299", "outputIndexes": [ 807 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 807 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1300", "outputIndexes": [ 808 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 808 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1301", "outputIndexes": [ 809 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 809, 808 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1302", "outputIndexes": [ 810 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 793, 810, 796 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_1_output_0", "outputIndexes": [ 811 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 811, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 812 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 804, 812, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.8/self_attn/Concat_output_0", "outputIndexes": [ 813 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 792, 813 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/self_attn/Reshape_output_0", "outputIndexes": [ 814 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 814 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 72115430, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.8/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 816 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 816, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_output_0", "outputIndexes": [ 817 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 816 ] , "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_2_output_0", "outputIndexes": [ 818 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 818 ] , "main_type": "NONE", "name": "Shape1317", "outputIndexes": [ 819 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 818 ] , "main_type": "NONE", "name": "Rank1319", "outputIndexes": [ 820 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 820, 820 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1321", "outputIndexes": [ 821 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 821 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1322", "outputIndexes": [ 822 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 821, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1324", "outputIndexes": [ 823 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 823 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1325", "outputIndexes": [ 824 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 819, 822, 824, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1328", "outputIndexes": [ 825 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 825 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1329", "outputIndexes": [ 826 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 826 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1330", "outputIndexes": [ 827 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 827, 826 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1331", "outputIndexes": [ 828 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 818, 828, 821 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_2_output_0", "outputIndexes": [ 829 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 829, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Div_output_0", "outputIndexes": [ 830 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 830, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 831 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 816, 831, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_1_output_0", "outputIndexes": [ 832 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 832 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.8/self_attn/Neg_output_0", "outputIndexes": [ 833 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 830, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 834 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 816, 20, 834, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_output_0", "outputIndexes": [ 835 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 833, 835 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.8/self_attn/Concat_3_output_0", "outputIndexes": [ 836 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 836, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_1_output_0", "outputIndexes": [ 837 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 817, 837 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Add_output_0", "outputIndexes": [ 838 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2878 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 72116454, 524310, 65536, 0, 0 ] } , "name": "/layers.8/self_attn/k_proj/Linear", "outputIndexes": [ 2883 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2883 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2884 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2884 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 839 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 803, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 840 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 811, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 841 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 840, 841, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.8/self_attn/Concat_1_output_0", "outputIndexes": [ 842 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 839, 842 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/self_attn/Reshape_1_output_0", "outputIndexes": [ 843 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 843 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 72706300, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.8/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 845 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 845, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_2_output_0", "outputIndexes": [ 846 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 845 ] , "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_3_output_0", "outputIndexes": [ 847 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 847 ] , "main_type": "NONE", "name": "Shape1359", "outputIndexes": [ 848 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 847 ] , "main_type": "NONE", "name": "Rank1361", "outputIndexes": [ 849 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 849, 849 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1363", "outputIndexes": [ 850 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 850 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1364", "outputIndexes": [ 851 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 850, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1366", "outputIndexes": [ 852 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 852 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1367", "outputIndexes": [ 853 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 848, 851, 853, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1370", "outputIndexes": [ 854 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 854 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1371", "outputIndexes": [ 855 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 855 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1372", "outputIndexes": [ 856 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 856, 855 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1373", "outputIndexes": [ 857 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 847, 857, 850 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_3_output_0", "outputIndexes": [ 858 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 858, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Div_1_output_0", "outputIndexes": [ 859 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 859, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 860 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 845, 860, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_3_output_0", "outputIndexes": [ 861 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 861 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.8/self_attn/Neg_1_output_0", "outputIndexes": [ 862 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 859, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 863 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 845, 20, 863, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_2_output_0", "outputIndexes": [ 864 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 862, 864 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.8/self_attn/Concat_4_output_0", "outputIndexes": [ 865 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 865, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_3_output_0", "outputIndexes": [ 866 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 846, 866 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Add_1_output_0", "outputIndexes": [ 867 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2878 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 72707324, 524310, 65536, 0, 0 ] } , "name": "/layers.8/self_attn/v_proj/Linear", "outputIndexes": [ 2887 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2887 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2888 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2888 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 868 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 803, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 869 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 811, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 870 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 869, 870, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.8/self_attn/Concat_2_output_0", "outputIndexes": [ 871 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 868, 871 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/self_attn/Reshape_2_output_0", "outputIndexes": [ 872 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 838, 867, 872, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.8/self_attn/FusedAttention", "outputIndexes": [ 873 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 873 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2889 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2889 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2890 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2890 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 73297170, 1048598, 131072, 0, 0 ] } , "name": "/layers.8/self_attn/o_proj/Linear", "outputIndexes": [ 2891 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2891 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2892 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2892 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 874 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 790, 874 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/Add_output_0", "outputIndexes": [ 875 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 875 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 74476840, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.8/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 876 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 876 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2893 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2893 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2894 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2894 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 74485032, 1572886, 196608, 0, 0 ] } , "name": "/layers.8/mlp/gate_proj/Linear", "outputIndexes": [ 2895 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2895 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2896 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2896 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 877 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 877 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.8/mlp/act_fn/Mul_output_0", "outputIndexes": [ 878 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2894 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 76254526, 1572886, 196608, 0, 0 ] } , "name": "/layers.8/mlp/up_proj/Linear", "outputIndexes": [ 2899 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2899 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2900 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2900 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 879 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 878, 879 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/mlp/Mul_output_0", "outputIndexes": [ 880 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 880 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2901 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2901 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2902 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2902 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 78024020, 1572886, 196608, 0, 0 ] } , "name": "/layers.8/mlp/down_proj/Linear", "outputIndexes": [ 2903 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2903 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2904 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2904 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 881 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 875, 881 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/Add_1_output_0", "outputIndexes": [ 882 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 882, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/Reshape_output_0", "outputIndexes": [ 883 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 883 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 79793514, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.9/input_layernorm/Mul_1_output_0", "outputIndexes": [ 884 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 884 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2905 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2905 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2906 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2906 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 79801706, 1048598, 131072, 0, 0 ] } , "name": "/layers.9/self_attn/q_proj/Linear", "outputIndexes": [ 2907 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2907 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2908 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2908 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 885 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 884 ] , "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_output_0", "outputIndexes": [ 886 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 886 ] , "main_type": "NONE", "name": "Shape1420", "outputIndexes": [ 887 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 886 ] , "main_type": "NONE", "name": "Rank1422", "outputIndexes": [ 888 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 888, 888 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1424", "outputIndexes": [ 889 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 889 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1425", "outputIndexes": [ 890 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 889, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1427", "outputIndexes": [ 891 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 891 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1428", "outputIndexes": [ 892 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 887, 890, 892, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1431", "outputIndexes": [ 893 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 893 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1432", "outputIndexes": [ 894 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 894, 894 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1434", "outputIndexes": [ 895 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 886, 895, 889 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_output_0", "outputIndexes": [ 896 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 896, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_output_0", "outputIndexes": [ 897 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 889 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1442", "outputIndexes": [ 898 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 891 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1445", "outputIndexes": [ 899 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 887, 898, 899, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1448", "outputIndexes": [ 900 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 900 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1449", "outputIndexes": [ 901 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 901 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1450", "outputIndexes": [ 902 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 902, 901 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1451", "outputIndexes": [ 903 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 886, 903, 889 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_1_output_0", "outputIndexes": [ 904 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 904, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 905 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 897, 905, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.9/self_attn/Concat_output_0", "outputIndexes": [ 906 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 885, 906 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/self_attn/Reshape_output_0", "outputIndexes": [ 907 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 907 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 80981376, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.9/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 909 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 909, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_output_0", "outputIndexes": [ 910 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 909 ] , "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_2_output_0", "outputIndexes": [ 911 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 911 ] , "main_type": "NONE", "name": "Shape1466", "outputIndexes": [ 912 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 911 ] , "main_type": "NONE", "name": "Rank1468", "outputIndexes": [ 913 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 913, 913 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1470", "outputIndexes": [ 914 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 914 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1471", "outputIndexes": [ 915 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 914, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1473", "outputIndexes": [ 916 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 916 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1474", "outputIndexes": [ 917 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 912, 915, 917, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1477", "outputIndexes": [ 918 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 918 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1478", "outputIndexes": [ 919 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 919 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1479", "outputIndexes": [ 920 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 920, 919 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1480", "outputIndexes": [ 921 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 911, 921, 914 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_2_output_0", "outputIndexes": [ 922 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 922, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Div_output_0", "outputIndexes": [ 923 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 923, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 924 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 909, 924, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_1_output_0", "outputIndexes": [ 925 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 925 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.9/self_attn/Neg_output_0", "outputIndexes": [ 926 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 923, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 927 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 909, 20, 927, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_output_0", "outputIndexes": [ 928 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 926, 928 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.9/self_attn/Concat_3_output_0", "outputIndexes": [ 929 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 929, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_1_output_0", "outputIndexes": [ 930 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 910, 930 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Add_output_0", "outputIndexes": [ 931 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2906 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 80982400, 524310, 65536, 0, 0 ] } , "name": "/layers.9/self_attn/k_proj/Linear", "outputIndexes": [ 2911 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2911 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2912 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2912 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 932 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 896, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 933 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 904, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 934 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 933, 934, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.9/self_attn/Concat_1_output_0", "outputIndexes": [ 935 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 932, 935 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/self_attn/Reshape_1_output_0", "outputIndexes": [ 936 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 936 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 81572246, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.9/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 938 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 938, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_2_output_0", "outputIndexes": [ 939 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 938 ] , "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_3_output_0", "outputIndexes": [ 940 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 940 ] , "main_type": "NONE", "name": "Shape1508", "outputIndexes": [ 941 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 940 ] , "main_type": "NONE", "name": "Rank1510", "outputIndexes": [ 942 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 942, 942 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1512", "outputIndexes": [ 943 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 943 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1513", "outputIndexes": [ 944 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 943, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1515", "outputIndexes": [ 945 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 945 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1516", "outputIndexes": [ 946 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 941, 944, 946, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1519", "outputIndexes": [ 947 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 947 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1520", "outputIndexes": [ 948 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 948 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1521", "outputIndexes": [ 949 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 949, 948 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1522", "outputIndexes": [ 950 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 940, 950, 943 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_3_output_0", "outputIndexes": [ 951 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 951, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Div_1_output_0", "outputIndexes": [ 952 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 952, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 953 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 938, 953, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_3_output_0", "outputIndexes": [ 954 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 954 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.9/self_attn/Neg_1_output_0", "outputIndexes": [ 955 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 952, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 956 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 938, 20, 956, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_2_output_0", "outputIndexes": [ 957 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 955, 957 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.9/self_attn/Concat_4_output_0", "outputIndexes": [ 958 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 958, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_3_output_0", "outputIndexes": [ 959 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 939, 959 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Add_1_output_0", "outputIndexes": [ 960 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2906 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 81573270, 524310, 65536, 0, 0 ] } , "name": "/layers.9/self_attn/v_proj/Linear", "outputIndexes": [ 2915 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2915 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2916 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2916 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 961 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 896, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 962 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 904, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 963 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 962, 963, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.9/self_attn/Concat_2_output_0", "outputIndexes": [ 964 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 961, 964 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/self_attn/Reshape_2_output_0", "outputIndexes": [ 965 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 931, 960, 965, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.9/self_attn/FusedAttention", "outputIndexes": [ 966 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 966 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2917 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2917 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2918 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2918 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 82163116, 1048598, 131072, 0, 0 ] } , "name": "/layers.9/self_attn/o_proj/Linear", "outputIndexes": [ 2919 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2919 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2920 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2920 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 967 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 883, 967 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/Add_output_0", "outputIndexes": [ 968 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 968 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 83342786, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.9/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 969 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 969 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2921 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2921 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2922 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2922 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 83350978, 1572886, 196608, 0, 0 ] } , "name": "/layers.9/mlp/gate_proj/Linear", "outputIndexes": [ 2923 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2923 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2924 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2924 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 970 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 970 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.9/mlp/act_fn/Mul_output_0", "outputIndexes": [ 971 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2922 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 85120472, 1572886, 196608, 0, 0 ] } , "name": "/layers.9/mlp/up_proj/Linear", "outputIndexes": [ 2927 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2927 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2928 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2928 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 972 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 971, 972 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/mlp/Mul_output_0", "outputIndexes": [ 973 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 973 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2929 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2929 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2930 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2930 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 86889966, 1572886, 196608, 0, 0 ] } , "name": "/layers.9/mlp/down_proj/Linear", "outputIndexes": [ 2931 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2931 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2932 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2932 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 974 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 968, 974 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/Add_1_output_0", "outputIndexes": [ 975 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 975, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/Reshape_output_0", "outputIndexes": [ 976 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 976 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 88659460, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.10/input_layernorm/Mul_1_output_0", "outputIndexes": [ 977 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 977 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2933 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2933 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2934 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2934 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 88667652, 1048598, 131072, 0, 0 ] } , "name": "/layers.10/self_attn/q_proj/Linear", "outputIndexes": [ 2935 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2935 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2936 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2936 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 978 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 977 ] , "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_output_0", "outputIndexes": [ 979 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 979 ] , "main_type": "NONE", "name": "Shape1569", "outputIndexes": [ 980 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 979 ] , "main_type": "NONE", "name": "Rank1571", "outputIndexes": [ 981 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 981, 981 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1573", "outputIndexes": [ 982 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 982 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1574", "outputIndexes": [ 983 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 982, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1576", "outputIndexes": [ 984 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 984 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1577", "outputIndexes": [ 985 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 980, 983, 985, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1580", "outputIndexes": [ 986 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 986 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1581", "outputIndexes": [ 987 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 987, 987 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1583", "outputIndexes": [ 988 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 979, 988, 982 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_output_0", "outputIndexes": [ 989 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 989, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_output_0", "outputIndexes": [ 990 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 982 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1591", "outputIndexes": [ 991 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 984 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1594", "outputIndexes": [ 992 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 980, 991, 992, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1597", "outputIndexes": [ 993 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 993 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1598", "outputIndexes": [ 994 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 994 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1599", "outputIndexes": [ 995 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 995, 994 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1600", "outputIndexes": [ 996 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 979, 996, 982 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_1_output_0", "outputIndexes": [ 997 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 997, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 998 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 990, 998, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.10/self_attn/Concat_output_0", "outputIndexes": [ 999 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 978, 999 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/self_attn/Reshape_output_0", "outputIndexes": [ 1000 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1000 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 89847322, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.10/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1002 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1002, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_output_0", "outputIndexes": [ 1003 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1002 ] , "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_2_output_0", "outputIndexes": [ 1004 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1004 ] , "main_type": "NONE", "name": "Shape1615", "outputIndexes": [ 1005 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1004 ] , "main_type": "NONE", "name": "Rank1617", "outputIndexes": [ 1006 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1006, 1006 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1619", "outputIndexes": [ 1007 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1007 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1620", "outputIndexes": [ 1008 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1007, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1622", "outputIndexes": [ 1009 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1009 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1623", "outputIndexes": [ 1010 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1005, 1008, 1010, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1626", "outputIndexes": [ 1011 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1011 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1627", "outputIndexes": [ 1012 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1012 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1628", "outputIndexes": [ 1013 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1013, 1012 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1629", "outputIndexes": [ 1014 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1004, 1014, 1007 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_2_output_0", "outputIndexes": [ 1015 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1015, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Div_output_0", "outputIndexes": [ 1016 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1016, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1017 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1002, 1017, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_1_output_0", "outputIndexes": [ 1018 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1018 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.10/self_attn/Neg_output_0", "outputIndexes": [ 1019 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1016, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1020 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1002, 20, 1020, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_output_0", "outputIndexes": [ 1021 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1019, 1021 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.10/self_attn/Concat_3_output_0", "outputIndexes": [ 1022 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1022, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_1_output_0", "outputIndexes": [ 1023 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1003, 1023 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Add_output_0", "outputIndexes": [ 1024 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2934 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 89848346, 524310, 65536, 0, 0 ] } , "name": "/layers.10/self_attn/k_proj/Linear", "outputIndexes": [ 2939 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2939 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2940 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2940 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1025 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 989, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1026 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 997, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1027 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1026, 1027, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.10/self_attn/Concat_1_output_0", "outputIndexes": [ 1028 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1025, 1028 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/self_attn/Reshape_1_output_0", "outputIndexes": [ 1029 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1029 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 90438192, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.10/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1031 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1031, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_2_output_0", "outputIndexes": [ 1032 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1031 ] , "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_3_output_0", "outputIndexes": [ 1033 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1033 ] , "main_type": "NONE", "name": "Shape1657", "outputIndexes": [ 1034 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1033 ] , "main_type": "NONE", "name": "Rank1659", "outputIndexes": [ 1035 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1035, 1035 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1661", "outputIndexes": [ 1036 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1036 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1662", "outputIndexes": [ 1037 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1036, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1664", "outputIndexes": [ 1038 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1038 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1665", "outputIndexes": [ 1039 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1034, 1037, 1039, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1668", "outputIndexes": [ 1040 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1040 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1669", "outputIndexes": [ 1041 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1041 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1670", "outputIndexes": [ 1042 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1042, 1041 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1671", "outputIndexes": [ 1043 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1033, 1043, 1036 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_3_output_0", "outputIndexes": [ 1044 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1044, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Div_1_output_0", "outputIndexes": [ 1045 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1045, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1046 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1031, 1046, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_3_output_0", "outputIndexes": [ 1047 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1047 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.10/self_attn/Neg_1_output_0", "outputIndexes": [ 1048 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1045, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1049 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1031, 20, 1049, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_2_output_0", "outputIndexes": [ 1050 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1048, 1050 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.10/self_attn/Concat_4_output_0", "outputIndexes": [ 1051 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1051, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_3_output_0", "outputIndexes": [ 1052 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1032, 1052 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Add_1_output_0", "outputIndexes": [ 1053 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2934 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 90439216, 524310, 65536, 0, 0 ] } , "name": "/layers.10/self_attn/v_proj/Linear", "outputIndexes": [ 2943 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2943 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2944 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2944 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1054 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 989, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1055 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 997, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1056 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1055, 1056, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.10/self_attn/Concat_2_output_0", "outputIndexes": [ 1057 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1054, 1057 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/self_attn/Reshape_2_output_0", "outputIndexes": [ 1058 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1024, 1053, 1058, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.10/self_attn/FusedAttention", "outputIndexes": [ 1059 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1059 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2945 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2945 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2946 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2946 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 91029062, 1048598, 131072, 0, 0 ] } , "name": "/layers.10/self_attn/o_proj/Linear", "outputIndexes": [ 2947 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2947 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2948 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2948 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1060 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 976, 1060 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/Add_output_0", "outputIndexes": [ 1061 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1061 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 92208732, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.10/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1062 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1062 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2949 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2949 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2950 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2950 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 92216924, 1572886, 196608, 0, 0 ] } , "name": "/layers.10/mlp/gate_proj/Linear", "outputIndexes": [ 2951 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2951 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2952 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2952 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1063 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1063 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.10/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1064 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2950 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 93986418, 1572886, 196608, 0, 0 ] } , "name": "/layers.10/mlp/up_proj/Linear", "outputIndexes": [ 2955 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2955 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2956 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2956 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1065 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1064, 1065 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/mlp/Mul_output_0", "outputIndexes": [ 1066 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1066 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2957 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2957 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2958 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2958 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 95755912, 1572886, 196608, 0, 0 ] } , "name": "/layers.10/mlp/down_proj/Linear", "outputIndexes": [ 2959 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2959 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2960 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2960 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1067 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1061, 1067 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/Add_1_output_0", "outputIndexes": [ 1068 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1068, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/Reshape_output_0", "outputIndexes": [ 1069 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1069 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 97525406, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.11/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1070 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1070 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2961 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2961 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2962 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2962 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 97533598, 1048598, 131072, 0, 0 ] } , "name": "/layers.11/self_attn/q_proj/Linear", "outputIndexes": [ 2963 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2963 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2964 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2964 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1071 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1070 ] , "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_output_0", "outputIndexes": [ 1072 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1072 ] , "main_type": "NONE", "name": "Shape1718", "outputIndexes": [ 1073 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1072 ] , "main_type": "NONE", "name": "Rank1720", "outputIndexes": [ 1074 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1074, 1074 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1722", "outputIndexes": [ 1075 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1075 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1723", "outputIndexes": [ 1076 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1075, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1725", "outputIndexes": [ 1077 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1077 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1726", "outputIndexes": [ 1078 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1073, 1076, 1078, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1729", "outputIndexes": [ 1079 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1079 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1730", "outputIndexes": [ 1080 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1080, 1080 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1732", "outputIndexes": [ 1081 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1072, 1081, 1075 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_output_0", "outputIndexes": [ 1082 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1082, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1083 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1075 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1740", "outputIndexes": [ 1084 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1077 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1743", "outputIndexes": [ 1085 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1073, 1084, 1085, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1746", "outputIndexes": [ 1086 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1086 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1747", "outputIndexes": [ 1087 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1087 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1748", "outputIndexes": [ 1088 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1088, 1087 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1749", "outputIndexes": [ 1089 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1072, 1089, 1075 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_1_output_0", "outputIndexes": [ 1090 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1090, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1091 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1083, 1091, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.11/self_attn/Concat_output_0", "outputIndexes": [ 1092 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1071, 1092 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/self_attn/Reshape_output_0", "outputIndexes": [ 1093 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1093 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 98713268, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.11/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1095 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1095, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_output_0", "outputIndexes": [ 1096 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1095 ] , "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_2_output_0", "outputIndexes": [ 1097 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1097 ] , "main_type": "NONE", "name": "Shape1764", "outputIndexes": [ 1098 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1097 ] , "main_type": "NONE", "name": "Rank1766", "outputIndexes": [ 1099 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1099, 1099 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1768", "outputIndexes": [ 1100 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1100 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1769", "outputIndexes": [ 1101 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1100, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1771", "outputIndexes": [ 1102 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1102 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1772", "outputIndexes": [ 1103 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1098, 1101, 1103, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1775", "outputIndexes": [ 1104 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1104 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1776", "outputIndexes": [ 1105 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1105 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1777", "outputIndexes": [ 1106 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1106, 1105 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1778", "outputIndexes": [ 1107 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1097, 1107, 1100 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_2_output_0", "outputIndexes": [ 1108 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1108, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Div_output_0", "outputIndexes": [ 1109 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1109, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1110 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1095, 1110, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_1_output_0", "outputIndexes": [ 1111 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1111 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.11/self_attn/Neg_output_0", "outputIndexes": [ 1112 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1109, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1113 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1095, 20, 1113, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_output_0", "outputIndexes": [ 1114 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1112, 1114 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.11/self_attn/Concat_3_output_0", "outputIndexes": [ 1115 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1115, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_1_output_0", "outputIndexes": [ 1116 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1096, 1116 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Add_output_0", "outputIndexes": [ 1117 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2962 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 98714292, 524310, 65536, 0, 0 ] } , "name": "/layers.11/self_attn/k_proj/Linear", "outputIndexes": [ 2967 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2967 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2968 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2968 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1118 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1082, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1119 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1090, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1120 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1119, 1120, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.11/self_attn/Concat_1_output_0", "outputIndexes": [ 1121 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1118, 1121 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/self_attn/Reshape_1_output_0", "outputIndexes": [ 1122 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1122 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 99304138, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.11/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1124 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1124, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_2_output_0", "outputIndexes": [ 1125 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1124 ] , "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_3_output_0", "outputIndexes": [ 1126 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1126 ] , "main_type": "NONE", "name": "Shape1806", "outputIndexes": [ 1127 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1126 ] , "main_type": "NONE", "name": "Rank1808", "outputIndexes": [ 1128 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1128, 1128 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1810", "outputIndexes": [ 1129 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1129 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1811", "outputIndexes": [ 1130 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1129, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1813", "outputIndexes": [ 1131 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1131 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1814", "outputIndexes": [ 1132 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1127, 1130, 1132, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1817", "outputIndexes": [ 1133 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1133 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1818", "outputIndexes": [ 1134 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1134 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1819", "outputIndexes": [ 1135 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1135, 1134 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1820", "outputIndexes": [ 1136 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1126, 1136, 1129 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_3_output_0", "outputIndexes": [ 1137 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1137, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Div_1_output_0", "outputIndexes": [ 1138 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1138, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1139 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1124, 1139, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_3_output_0", "outputIndexes": [ 1140 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1140 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.11/self_attn/Neg_1_output_0", "outputIndexes": [ 1141 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1138, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1142 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1124, 20, 1142, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_2_output_0", "outputIndexes": [ 1143 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1141, 1143 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.11/self_attn/Concat_4_output_0", "outputIndexes": [ 1144 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1144, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_3_output_0", "outputIndexes": [ 1145 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1125, 1145 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Add_1_output_0", "outputIndexes": [ 1146 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2962 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 99305162, 524310, 65536, 0, 0 ] } , "name": "/layers.11/self_attn/v_proj/Linear", "outputIndexes": [ 2971 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2971 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2972 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2972 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1147 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1082, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1148 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1090, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1149 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1148, 1149, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.11/self_attn/Concat_2_output_0", "outputIndexes": [ 1150 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1147, 1150 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/self_attn/Reshape_2_output_0", "outputIndexes": [ 1151 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1117, 1146, 1151, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.11/self_attn/FusedAttention", "outputIndexes": [ 1152 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1152 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2973 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2973 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2974 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2974 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 99895008, 1048598, 131072, 0, 0 ] } , "name": "/layers.11/self_attn/o_proj/Linear", "outputIndexes": [ 2975 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2975 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2976 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2976 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1153 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1069, 1153 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/Add_output_0", "outputIndexes": [ 1154 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1154 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 101074678, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.11/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1155 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1155 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2977 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2977 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2978 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2978 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 101082870, 1572886, 196608, 0, 0 ] } , "name": "/layers.11/mlp/gate_proj/Linear", "outputIndexes": [ 2979 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2979 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2980 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2980 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1156 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1156 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.11/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1157 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2978 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 102852364, 1572886, 196608, 0, 0 ] } , "name": "/layers.11/mlp/up_proj/Linear", "outputIndexes": [ 2983 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2983 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2984 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2984 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1158 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1157, 1158 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/mlp/Mul_output_0", "outputIndexes": [ 1159 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1159 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2985 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2985 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2986 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2986 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 104621858, 1572886, 196608, 0, 0 ] } , "name": "/layers.11/mlp/down_proj/Linear", "outputIndexes": [ 2987 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2987 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2988 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2988 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1160 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1154, 1160 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/Add_1_output_0", "outputIndexes": [ 1161 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1161, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/Reshape_output_0", "outputIndexes": [ 1162 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1162 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 106391352, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.12/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1163 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1163 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2989 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2989 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2990 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2990 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 106399544, 1048598, 131072, 0, 0 ] } , "name": "/layers.12/self_attn/q_proj/Linear", "outputIndexes": [ 2991 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2991 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2992 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2992 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1164 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1163 ] , "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_output_0", "outputIndexes": [ 1165 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1165 ] , "main_type": "NONE", "name": "Shape1867", "outputIndexes": [ 1166 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1165 ] , "main_type": "NONE", "name": "Rank1869", "outputIndexes": [ 1167 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1167, 1167 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1871", "outputIndexes": [ 1168 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1168 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1872", "outputIndexes": [ 1169 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1168, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1874", "outputIndexes": [ 1170 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1170 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1875", "outputIndexes": [ 1171 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1166, 1169, 1171, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1878", "outputIndexes": [ 1172 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1172 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1879", "outputIndexes": [ 1173 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1173, 1173 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1881", "outputIndexes": [ 1174 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165, 1174, 1168 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_output_0", "outputIndexes": [ 1175 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1175, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1176 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1168 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1889", "outputIndexes": [ 1177 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1170 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1892", "outputIndexes": [ 1178 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1166, 1177, 1178, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1895", "outputIndexes": [ 1179 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1179 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1896", "outputIndexes": [ 1180 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1180 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1897", "outputIndexes": [ 1181 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1181, 1180 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1898", "outputIndexes": [ 1182 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165, 1182, 1168 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_1_output_0", "outputIndexes": [ 1183 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1183, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1184 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1176, 1184, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.12/self_attn/Concat_output_0", "outputIndexes": [ 1185 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1164, 1185 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/self_attn/Reshape_output_0", "outputIndexes": [ 1186 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1186 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 107579214, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.12/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1188 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1188, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_output_0", "outputIndexes": [ 1189 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1188 ] , "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_2_output_0", "outputIndexes": [ 1190 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1190 ] , "main_type": "NONE", "name": "Shape1913", "outputIndexes": [ 1191 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1190 ] , "main_type": "NONE", "name": "Rank1915", "outputIndexes": [ 1192 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1192, 1192 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1917", "outputIndexes": [ 1193 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1193 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1918", "outputIndexes": [ 1194 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1193, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1920", "outputIndexes": [ 1195 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1195 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1921", "outputIndexes": [ 1196 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1191, 1194, 1196, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1924", "outputIndexes": [ 1197 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1197 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1925", "outputIndexes": [ 1198 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1198 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1926", "outputIndexes": [ 1199 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1199, 1198 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1927", "outputIndexes": [ 1200 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1190, 1200, 1193 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_2_output_0", "outputIndexes": [ 1201 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1201, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Div_output_0", "outputIndexes": [ 1202 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1202, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1203 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1188, 1203, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_1_output_0", "outputIndexes": [ 1204 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1204 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.12/self_attn/Neg_output_0", "outputIndexes": [ 1205 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1202, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1206 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1188, 20, 1206, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_output_0", "outputIndexes": [ 1207 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1205, 1207 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.12/self_attn/Concat_3_output_0", "outputIndexes": [ 1208 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1208, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_1_output_0", "outputIndexes": [ 1209 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1189, 1209 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Add_output_0", "outputIndexes": [ 1210 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2990 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 107580238, 524310, 65536, 0, 0 ] } , "name": "/layers.12/self_attn/k_proj/Linear", "outputIndexes": [ 2995 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2995 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2996 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2996 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1211 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1175, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1212 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1183, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1213 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1212, 1213, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.12/self_attn/Concat_1_output_0", "outputIndexes": [ 1214 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1211, 1214 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/self_attn/Reshape_1_output_0", "outputIndexes": [ 1215 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1215 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 108170084, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.12/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1217 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1217, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_2_output_0", "outputIndexes": [ 1218 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1217 ] , "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_3_output_0", "outputIndexes": [ 1219 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1219 ] , "main_type": "NONE", "name": "Shape1955", "outputIndexes": [ 1220 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1219 ] , "main_type": "NONE", "name": "Rank1957", "outputIndexes": [ 1221 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1221, 1221 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1959", "outputIndexes": [ 1222 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1222 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1960", "outputIndexes": [ 1223 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1222, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1962", "outputIndexes": [ 1224 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1224 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1963", "outputIndexes": [ 1225 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1220, 1223, 1225, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1966", "outputIndexes": [ 1226 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1226 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1967", "outputIndexes": [ 1227 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1227 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1968", "outputIndexes": [ 1228 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1228, 1227 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1969", "outputIndexes": [ 1229 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1219, 1229, 1222 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_3_output_0", "outputIndexes": [ 1230 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1230, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Div_1_output_0", "outputIndexes": [ 1231 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1231, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1232 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1217, 1232, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_3_output_0", "outputIndexes": [ 1233 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1233 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.12/self_attn/Neg_1_output_0", "outputIndexes": [ 1234 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1231, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1235 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1217, 20, 1235, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_2_output_0", "outputIndexes": [ 1236 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1234, 1236 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.12/self_attn/Concat_4_output_0", "outputIndexes": [ 1237 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1237, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_3_output_0", "outputIndexes": [ 1238 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1218, 1238 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Add_1_output_0", "outputIndexes": [ 1239 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2990 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 108171108, 524310, 65536, 0, 0 ] } , "name": "/layers.12/self_attn/v_proj/Linear", "outputIndexes": [ 2999 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2999 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3000 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3000 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1240 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1175, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1241 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1183, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1242 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1241, 1242, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.12/self_attn/Concat_2_output_0", "outputIndexes": [ 1243 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1240, 1243 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/self_attn/Reshape_2_output_0", "outputIndexes": [ 1244 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1210, 1239, 1244, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.12/self_attn/FusedAttention", "outputIndexes": [ 1245 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1245 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3001 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3001 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3002 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3002 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 108760954, 1048598, 131072, 0, 0 ] } , "name": "/layers.12/self_attn/o_proj/Linear", "outputIndexes": [ 3003 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3003 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3004 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3004 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1246 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1162, 1246 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/Add_output_0", "outputIndexes": [ 1247 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1247 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 109940624, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.12/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1248 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1248 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3005 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3005 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3006 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3006 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 109948816, 1572886, 196608, 0, 0 ] } , "name": "/layers.12/mlp/gate_proj/Linear", "outputIndexes": [ 3007 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3007 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3008 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3008 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1249 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1249 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.12/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1250 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3006 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 111718310, 1572886, 196608, 0, 0 ] } , "name": "/layers.12/mlp/up_proj/Linear", "outputIndexes": [ 3011 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3011 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3012 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3012 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1251 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1250, 1251 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/mlp/Mul_output_0", "outputIndexes": [ 1252 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1252 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3013 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3013 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3014 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3014 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 113487804, 1572886, 196608, 0, 0 ] } , "name": "/layers.12/mlp/down_proj/Linear", "outputIndexes": [ 3015 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3015 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3016 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3016 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1253 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1247, 1253 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/Add_1_output_0", "outputIndexes": [ 1254 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1254, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/Reshape_output_0", "outputIndexes": [ 1255 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1255 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 115257298, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.13/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1256 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1256 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3017 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3017 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3018 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3018 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 115265490, 1048598, 131072, 0, 0 ] } , "name": "/layers.13/self_attn/q_proj/Linear", "outputIndexes": [ 3019 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3019 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3020 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3020 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1257 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1256 ] , "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_output_0", "outputIndexes": [ 1258 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1258 ] , "main_type": "NONE", "name": "Shape2016", "outputIndexes": [ 1259 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1258 ] , "main_type": "NONE", "name": "Rank2018", "outputIndexes": [ 1260 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1260, 1260 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2020", "outputIndexes": [ 1261 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1261 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2021", "outputIndexes": [ 1262 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1261, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2023", "outputIndexes": [ 1263 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1263 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2024", "outputIndexes": [ 1264 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1259, 1262, 1264, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2027", "outputIndexes": [ 1265 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1265 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2028", "outputIndexes": [ 1266 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1266, 1266 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2030", "outputIndexes": [ 1267 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1258, 1267, 1261 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_output_0", "outputIndexes": [ 1268 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1268, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1269 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1261 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2038", "outputIndexes": [ 1270 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1263 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2041", "outputIndexes": [ 1271 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1259, 1270, 1271, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2044", "outputIndexes": [ 1272 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1272 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2045", "outputIndexes": [ 1273 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1273 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2046", "outputIndexes": [ 1274 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1274, 1273 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2047", "outputIndexes": [ 1275 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1258, 1275, 1261 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_1_output_0", "outputIndexes": [ 1276 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1276, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1277 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1269, 1277, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.13/self_attn/Concat_output_0", "outputIndexes": [ 1278 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1257, 1278 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/self_attn/Reshape_output_0", "outputIndexes": [ 1279 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1279 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 116445160, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.13/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1281 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1281, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_output_0", "outputIndexes": [ 1282 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1281 ] , "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_2_output_0", "outputIndexes": [ 1283 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1283 ] , "main_type": "NONE", "name": "Shape2062", "outputIndexes": [ 1284 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1283 ] , "main_type": "NONE", "name": "Rank2064", "outputIndexes": [ 1285 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1285, 1285 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2066", "outputIndexes": [ 1286 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1286 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2067", "outputIndexes": [ 1287 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1286, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2069", "outputIndexes": [ 1288 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1288 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2070", "outputIndexes": [ 1289 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1284, 1287, 1289, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2073", "outputIndexes": [ 1290 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1290 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2074", "outputIndexes": [ 1291 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1291 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2075", "outputIndexes": [ 1292 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1292, 1291 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2076", "outputIndexes": [ 1293 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1283, 1293, 1286 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_2_output_0", "outputIndexes": [ 1294 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1294, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Div_output_0", "outputIndexes": [ 1295 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1295, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1296 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1281, 1296, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_1_output_0", "outputIndexes": [ 1297 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1297 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.13/self_attn/Neg_output_0", "outputIndexes": [ 1298 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1295, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1299 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1281, 20, 1299, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_output_0", "outputIndexes": [ 1300 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1298, 1300 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.13/self_attn/Concat_3_output_0", "outputIndexes": [ 1301 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1301, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_1_output_0", "outputIndexes": [ 1302 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1282, 1302 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Add_output_0", "outputIndexes": [ 1303 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3018 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 116446184, 524310, 65536, 0, 0 ] } , "name": "/layers.13/self_attn/k_proj/Linear", "outputIndexes": [ 3023 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3023 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3024 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3024 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1304 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1268, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1305 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1276, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1306 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1305, 1306, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.13/self_attn/Concat_1_output_0", "outputIndexes": [ 1307 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1304, 1307 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/self_attn/Reshape_1_output_0", "outputIndexes": [ 1308 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1308 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 117036030, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.13/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1310 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1310, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_2_output_0", "outputIndexes": [ 1311 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1310 ] , "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_3_output_0", "outputIndexes": [ 1312 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1312 ] , "main_type": "NONE", "name": "Shape2104", "outputIndexes": [ 1313 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1312 ] , "main_type": "NONE", "name": "Rank2106", "outputIndexes": [ 1314 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1314, 1314 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2108", "outputIndexes": [ 1315 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1315 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2109", "outputIndexes": [ 1316 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1315, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2111", "outputIndexes": [ 1317 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1317 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2112", "outputIndexes": [ 1318 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1313, 1316, 1318, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2115", "outputIndexes": [ 1319 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1319 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2116", "outputIndexes": [ 1320 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1320 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2117", "outputIndexes": [ 1321 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1321, 1320 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2118", "outputIndexes": [ 1322 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1312, 1322, 1315 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_3_output_0", "outputIndexes": [ 1323 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1323, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Div_1_output_0", "outputIndexes": [ 1324 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1324, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1325 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1310, 1325, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_3_output_0", "outputIndexes": [ 1326 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1326 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.13/self_attn/Neg_1_output_0", "outputIndexes": [ 1327 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1324, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1328 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1310, 20, 1328, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_2_output_0", "outputIndexes": [ 1329 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1327, 1329 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.13/self_attn/Concat_4_output_0", "outputIndexes": [ 1330 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1330, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_3_output_0", "outputIndexes": [ 1331 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1311, 1331 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Add_1_output_0", "outputIndexes": [ 1332 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3018 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 117037054, 524310, 65536, 0, 0 ] } , "name": "/layers.13/self_attn/v_proj/Linear", "outputIndexes": [ 3027 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3027 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3028 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3028 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1333 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1268, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1334 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1276, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1335 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1334, 1335, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.13/self_attn/Concat_2_output_0", "outputIndexes": [ 1336 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1333, 1336 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/self_attn/Reshape_2_output_0", "outputIndexes": [ 1337 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1303, 1332, 1337, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.13/self_attn/FusedAttention", "outputIndexes": [ 1338 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1338 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3029 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3029 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3030 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3030 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 117626900, 1048598, 131072, 0, 0 ] } , "name": "/layers.13/self_attn/o_proj/Linear", "outputIndexes": [ 3031 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3031 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3032 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3032 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1339 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1255, 1339 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/Add_output_0", "outputIndexes": [ 1340 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1340 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 118806570, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.13/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1341 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1341 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3033 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3033 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3034 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3034 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 118814762, 1572886, 196608, 0, 0 ] } , "name": "/layers.13/mlp/gate_proj/Linear", "outputIndexes": [ 3035 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3035 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3036 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3036 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1342 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1342 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.13/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1343 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3034 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 120584256, 1572886, 196608, 0, 0 ] } , "name": "/layers.13/mlp/up_proj/Linear", "outputIndexes": [ 3039 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3039 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3040 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3040 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1344 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1343, 1344 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/mlp/Mul_output_0", "outputIndexes": [ 1345 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1345 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3041 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3041 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3042 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3042 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 122353750, 1572886, 196608, 0, 0 ] } , "name": "/layers.13/mlp/down_proj/Linear", "outputIndexes": [ 3043 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3043 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3044 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3044 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1346 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1340, 1346 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/Add_1_output_0", "outputIndexes": [ 1347 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1347, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/Reshape_output_0", "outputIndexes": [ 1348 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1348 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 124123244, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.14/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1349 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1349 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3045 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3045 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3046 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3046 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 124131436, 1048598, 131072, 0, 0 ] } , "name": "/layers.14/self_attn/q_proj/Linear", "outputIndexes": [ 3047 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3047 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3048 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3048 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1350 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1349 ] , "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_output_0", "outputIndexes": [ 1351 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1351 ] , "main_type": "NONE", "name": "Shape2165", "outputIndexes": [ 1352 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1351 ] , "main_type": "NONE", "name": "Rank2167", "outputIndexes": [ 1353 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1353, 1353 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2169", "outputIndexes": [ 1354 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1354 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2170", "outputIndexes": [ 1355 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1354, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2172", "outputIndexes": [ 1356 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1356 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2173", "outputIndexes": [ 1357 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1352, 1355, 1357, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2176", "outputIndexes": [ 1358 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1358 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2177", "outputIndexes": [ 1359 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1359, 1359 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2179", "outputIndexes": [ 1360 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1351, 1360, 1354 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_output_0", "outputIndexes": [ 1361 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1361, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1362 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1354 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2187", "outputIndexes": [ 1363 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1356 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2190", "outputIndexes": [ 1364 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1352, 1363, 1364, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2193", "outputIndexes": [ 1365 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1365 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2194", "outputIndexes": [ 1366 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1366 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2195", "outputIndexes": [ 1367 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1367, 1366 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2196", "outputIndexes": [ 1368 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1351, 1368, 1354 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_1_output_0", "outputIndexes": [ 1369 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1369, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1370 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1362, 1370, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.14/self_attn/Concat_output_0", "outputIndexes": [ 1371 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1350, 1371 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/self_attn/Reshape_output_0", "outputIndexes": [ 1372 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1372 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 125311106, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.14/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1374 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1374, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_output_0", "outputIndexes": [ 1375 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1374 ] , "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_2_output_0", "outputIndexes": [ 1376 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1376 ] , "main_type": "NONE", "name": "Shape2211", "outputIndexes": [ 1377 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1376 ] , "main_type": "NONE", "name": "Rank2213", "outputIndexes": [ 1378 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1378, 1378 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2215", "outputIndexes": [ 1379 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1379 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2216", "outputIndexes": [ 1380 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1379, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2218", "outputIndexes": [ 1381 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1381 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2219", "outputIndexes": [ 1382 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1377, 1380, 1382, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2222", "outputIndexes": [ 1383 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1383 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2223", "outputIndexes": [ 1384 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1384 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2224", "outputIndexes": [ 1385 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1385, 1384 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2225", "outputIndexes": [ 1386 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1376, 1386, 1379 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_2_output_0", "outputIndexes": [ 1387 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1387, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Div_output_0", "outputIndexes": [ 1388 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1388, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1389 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1374, 1389, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_1_output_0", "outputIndexes": [ 1390 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1390 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.14/self_attn/Neg_output_0", "outputIndexes": [ 1391 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1388, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1392 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1374, 20, 1392, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_output_0", "outputIndexes": [ 1393 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1391, 1393 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.14/self_attn/Concat_3_output_0", "outputIndexes": [ 1394 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1394, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_1_output_0", "outputIndexes": [ 1395 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1375, 1395 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Add_output_0", "outputIndexes": [ 1396 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3046 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 125312130, 524310, 65536, 0, 0 ] } , "name": "/layers.14/self_attn/k_proj/Linear", "outputIndexes": [ 3051 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3051 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3052 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3052 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1397 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1361, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1398 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1369, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1399 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1398, 1399, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.14/self_attn/Concat_1_output_0", "outputIndexes": [ 1400 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1397, 1400 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/self_attn/Reshape_1_output_0", "outputIndexes": [ 1401 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1401 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 125901976, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.14/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1403 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1403, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_2_output_0", "outputIndexes": [ 1404 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1403 ] , "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_3_output_0", "outputIndexes": [ 1405 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1405 ] , "main_type": "NONE", "name": "Shape2253", "outputIndexes": [ 1406 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1405 ] , "main_type": "NONE", "name": "Rank2255", "outputIndexes": [ 1407 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1407, 1407 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2257", "outputIndexes": [ 1408 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1408 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2258", "outputIndexes": [ 1409 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1408, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2260", "outputIndexes": [ 1410 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1410 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2261", "outputIndexes": [ 1411 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1406, 1409, 1411, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2264", "outputIndexes": [ 1412 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1412 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2265", "outputIndexes": [ 1413 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1413 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2266", "outputIndexes": [ 1414 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1414, 1413 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2267", "outputIndexes": [ 1415 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1405, 1415, 1408 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_3_output_0", "outputIndexes": [ 1416 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1416, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Div_1_output_0", "outputIndexes": [ 1417 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1417, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1418 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1403, 1418, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_3_output_0", "outputIndexes": [ 1419 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1419 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.14/self_attn/Neg_1_output_0", "outputIndexes": [ 1420 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1417, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1421 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1403, 20, 1421, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_2_output_0", "outputIndexes": [ 1422 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1420, 1422 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.14/self_attn/Concat_4_output_0", "outputIndexes": [ 1423 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1423, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_3_output_0", "outputIndexes": [ 1424 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1404, 1424 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Add_1_output_0", "outputIndexes": [ 1425 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3046 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 125903000, 524310, 65536, 0, 0 ] } , "name": "/layers.14/self_attn/v_proj/Linear", "outputIndexes": [ 3055 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3055 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3056 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3056 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1426 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1361, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1427 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1369, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1428 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1427, 1428, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.14/self_attn/Concat_2_output_0", "outputIndexes": [ 1429 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1426, 1429 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/self_attn/Reshape_2_output_0", "outputIndexes": [ 1430 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1396, 1425, 1430, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.14/self_attn/FusedAttention", "outputIndexes": [ 1431 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1431 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3057 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3057 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3058 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3058 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 126492846, 1048598, 131072, 0, 0 ] } , "name": "/layers.14/self_attn/o_proj/Linear", "outputIndexes": [ 3059 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3059 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3060 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3060 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1432 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1348, 1432 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/Add_output_0", "outputIndexes": [ 1433 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1433 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 127672516, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.14/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1434 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1434 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3061 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3061 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3062 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3062 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 127680708, 1572886, 196608, 0, 0 ] } , "name": "/layers.14/mlp/gate_proj/Linear", "outputIndexes": [ 3063 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3063 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3064 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3064 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1435 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1435 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.14/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1436 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3062 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 129450202, 1572886, 196608, 0, 0 ] } , "name": "/layers.14/mlp/up_proj/Linear", "outputIndexes": [ 3067 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3067 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3068 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3068 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1437 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1436, 1437 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/mlp/Mul_output_0", "outputIndexes": [ 1438 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1438 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3069 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3069 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3070 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3070 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 131219696, 1572886, 196608, 0, 0 ] } , "name": "/layers.14/mlp/down_proj/Linear", "outputIndexes": [ 3071 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3071 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3072 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3072 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1439 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1433, 1439 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/Add_1_output_0", "outputIndexes": [ 1440 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1440, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/Reshape_output_0", "outputIndexes": [ 1441 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1441 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 132989190, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.15/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1442 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1442 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3073 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3073 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3074 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3074 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 132997382, 1048598, 131072, 0, 0 ] } , "name": "/layers.15/self_attn/q_proj/Linear", "outputIndexes": [ 3075 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3075 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3076 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3076 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1443 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1442 ] , "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_output_0", "outputIndexes": [ 1444 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1444 ] , "main_type": "NONE", "name": "Shape2314", "outputIndexes": [ 1445 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1444 ] , "main_type": "NONE", "name": "Rank2316", "outputIndexes": [ 1446 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1446, 1446 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2318", "outputIndexes": [ 1447 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1447 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2319", "outputIndexes": [ 1448 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1447, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2321", "outputIndexes": [ 1449 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1449 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2322", "outputIndexes": [ 1450 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1445, 1448, 1450, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2325", "outputIndexes": [ 1451 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1451 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2326", "outputIndexes": [ 1452 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1452, 1452 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2328", "outputIndexes": [ 1453 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1444, 1453, 1447 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_output_0", "outputIndexes": [ 1454 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1454, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1455 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1447 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2336", "outputIndexes": [ 1456 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1449 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2339", "outputIndexes": [ 1457 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1445, 1456, 1457, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2342", "outputIndexes": [ 1458 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1458 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2343", "outputIndexes": [ 1459 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1459 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2344", "outputIndexes": [ 1460 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1460, 1459 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2345", "outputIndexes": [ 1461 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1444, 1461, 1447 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_1_output_0", "outputIndexes": [ 1462 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1462, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1463 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1455, 1463, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.15/self_attn/Concat_output_0", "outputIndexes": [ 1464 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1443, 1464 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/self_attn/Reshape_output_0", "outputIndexes": [ 1465 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1465 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 134177052, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.15/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1467 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1467, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_output_0", "outputIndexes": [ 1468 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1467 ] , "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_2_output_0", "outputIndexes": [ 1469 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1469 ] , "main_type": "NONE", "name": "Shape2360", "outputIndexes": [ 1470 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1469 ] , "main_type": "NONE", "name": "Rank2362", "outputIndexes": [ 1471 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1471, 1471 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2364", "outputIndexes": [ 1472 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1472 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2365", "outputIndexes": [ 1473 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1472, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2367", "outputIndexes": [ 1474 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1474 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2368", "outputIndexes": [ 1475 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1470, 1473, 1475, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2371", "outputIndexes": [ 1476 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1476 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2372", "outputIndexes": [ 1477 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1477 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2373", "outputIndexes": [ 1478 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1478, 1477 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2374", "outputIndexes": [ 1479 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1469, 1479, 1472 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_2_output_0", "outputIndexes": [ 1480 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1480, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Div_output_0", "outputIndexes": [ 1481 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1481, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1482 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1467, 1482, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_1_output_0", "outputIndexes": [ 1483 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1483 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.15/self_attn/Neg_output_0", "outputIndexes": [ 1484 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1481, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1485 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1467, 20, 1485, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_output_0", "outputIndexes": [ 1486 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1484, 1486 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.15/self_attn/Concat_3_output_0", "outputIndexes": [ 1487 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1487, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_1_output_0", "outputIndexes": [ 1488 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1468, 1488 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Add_output_0", "outputIndexes": [ 1489 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3074 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 134178076, 524310, 65536, 0, 0 ] } , "name": "/layers.15/self_attn/k_proj/Linear", "outputIndexes": [ 3079 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3079 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3080 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3080 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1490 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1454, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1491 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1462, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1492 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1491, 1492, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.15/self_attn/Concat_1_output_0", "outputIndexes": [ 1493 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1490, 1493 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/self_attn/Reshape_1_output_0", "outputIndexes": [ 1494 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1494 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 134767922, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.15/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1496 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1496, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_2_output_0", "outputIndexes": [ 1497 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1496 ] , "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_3_output_0", "outputIndexes": [ 1498 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1498 ] , "main_type": "NONE", "name": "Shape2402", "outputIndexes": [ 1499 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1498 ] , "main_type": "NONE", "name": "Rank2404", "outputIndexes": [ 1500 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1500, 1500 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2406", "outputIndexes": [ 1501 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1501 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2407", "outputIndexes": [ 1502 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1501, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2409", "outputIndexes": [ 1503 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1503 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2410", "outputIndexes": [ 1504 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1499, 1502, 1504, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2413", "outputIndexes": [ 1505 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1505 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2414", "outputIndexes": [ 1506 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1506 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2415", "outputIndexes": [ 1507 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1507, 1506 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2416", "outputIndexes": [ 1508 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1498, 1508, 1501 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_3_output_0", "outputIndexes": [ 1509 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1509, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Div_1_output_0", "outputIndexes": [ 1510 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1510, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1511 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1496, 1511, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_3_output_0", "outputIndexes": [ 1512 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1512 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.15/self_attn/Neg_1_output_0", "outputIndexes": [ 1513 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1510, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1514 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1496, 20, 1514, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_2_output_0", "outputIndexes": [ 1515 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1513, 1515 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.15/self_attn/Concat_4_output_0", "outputIndexes": [ 1516 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1516, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_3_output_0", "outputIndexes": [ 1517 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1497, 1517 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Add_1_output_0", "outputIndexes": [ 1518 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3074 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 134768946, 524310, 65536, 0, 0 ] } , "name": "/layers.15/self_attn/v_proj/Linear", "outputIndexes": [ 3083 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3083 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3084 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3084 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1519 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1454, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1520 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1462, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1521 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1520, 1521, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.15/self_attn/Concat_2_output_0", "outputIndexes": [ 1522 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1519, 1522 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/self_attn/Reshape_2_output_0", "outputIndexes": [ 1523 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1489, 1518, 1523, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.15/self_attn/FusedAttention", "outputIndexes": [ 1524 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1524 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3085 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3085 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3086 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3086 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 135358792, 1048598, 131072, 0, 0 ] } , "name": "/layers.15/self_attn/o_proj/Linear", "outputIndexes": [ 3087 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3087 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3088 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3088 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1525 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1441, 1525 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/Add_output_0", "outputIndexes": [ 1526 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1526 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 136538462, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.15/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1527 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1527 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3089 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3089 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3090 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3090 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 136546654, 1572886, 196608, 0, 0 ] } , "name": "/layers.15/mlp/gate_proj/Linear", "outputIndexes": [ 3091 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3091 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3092 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3092 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1528 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1528 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.15/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1529 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3090 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 138316148, 1572886, 196608, 0, 0 ] } , "name": "/layers.15/mlp/up_proj/Linear", "outputIndexes": [ 3095 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3095 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3096 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3096 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1530 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1529, 1530 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/mlp/Mul_output_0", "outputIndexes": [ 1531 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1531 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3097 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3097 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3098 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3098 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 140085642, 1572886, 196608, 0, 0 ] } , "name": "/layers.15/mlp/down_proj/Linear", "outputIndexes": [ 3099 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3099 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3100 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3100 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1532 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1526, 1532 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/Add_1_output_0", "outputIndexes": [ 1533 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1533, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/Reshape_output_0", "outputIndexes": [ 1534 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1534 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 141855136, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.16/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1535 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1535 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3101 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3101 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3102 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3102 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 141863328, 1048598, 131072, 0, 0 ] } , "name": "/layers.16/self_attn/q_proj/Linear", "outputIndexes": [ 3103 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3103 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3104 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3104 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1536 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1535 ] , "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_output_0", "outputIndexes": [ 1537 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1537 ] , "main_type": "NONE", "name": "Shape2463", "outputIndexes": [ 1538 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1537 ] , "main_type": "NONE", "name": "Rank2465", "outputIndexes": [ 1539 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1539, 1539 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2467", "outputIndexes": [ 1540 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1540 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2468", "outputIndexes": [ 1541 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1540, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2470", "outputIndexes": [ 1542 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1542 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2471", "outputIndexes": [ 1543 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1538, 1541, 1543, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2474", "outputIndexes": [ 1544 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1544 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2475", "outputIndexes": [ 1545 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1545, 1545 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2477", "outputIndexes": [ 1546 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1537, 1546, 1540 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_output_0", "outputIndexes": [ 1547 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1547, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1548 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1540 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2485", "outputIndexes": [ 1549 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1542 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2488", "outputIndexes": [ 1550 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1538, 1549, 1550, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2491", "outputIndexes": [ 1551 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1551 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2492", "outputIndexes": [ 1552 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1552 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2493", "outputIndexes": [ 1553 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1553, 1552 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2494", "outputIndexes": [ 1554 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1537, 1554, 1540 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_1_output_0", "outputIndexes": [ 1555 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1555, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1556 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1548, 1556, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.16/self_attn/Concat_output_0", "outputIndexes": [ 1557 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1536, 1557 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/self_attn/Reshape_output_0", "outputIndexes": [ 1558 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1558 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 143042998, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.16/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1560 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1560, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_output_0", "outputIndexes": [ 1561 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1560 ] , "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_2_output_0", "outputIndexes": [ 1562 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1562 ] , "main_type": "NONE", "name": "Shape2509", "outputIndexes": [ 1563 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1562 ] , "main_type": "NONE", "name": "Rank2511", "outputIndexes": [ 1564 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1564, 1564 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2513", "outputIndexes": [ 1565 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1565 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2514", "outputIndexes": [ 1566 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1565, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2516", "outputIndexes": [ 1567 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1567 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2517", "outputIndexes": [ 1568 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1563, 1566, 1568, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2520", "outputIndexes": [ 1569 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1569 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2521", "outputIndexes": [ 1570 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1570 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2522", "outputIndexes": [ 1571 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1571, 1570 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2523", "outputIndexes": [ 1572 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1562, 1572, 1565 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_2_output_0", "outputIndexes": [ 1573 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1573, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Div_output_0", "outputIndexes": [ 1574 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1574, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1575 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1560, 1575, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_1_output_0", "outputIndexes": [ 1576 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1576 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.16/self_attn/Neg_output_0", "outputIndexes": [ 1577 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1574, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1578 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1560, 20, 1578, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_output_0", "outputIndexes": [ 1579 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1577, 1579 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.16/self_attn/Concat_3_output_0", "outputIndexes": [ 1580 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1580, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_1_output_0", "outputIndexes": [ 1581 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1561, 1581 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Add_output_0", "outputIndexes": [ 1582 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3102 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 143044022, 524310, 65536, 0, 0 ] } , "name": "/layers.16/self_attn/k_proj/Linear", "outputIndexes": [ 3107 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3107 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3108 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3108 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1583 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1547, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1584 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1555, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1585 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1584, 1585, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.16/self_attn/Concat_1_output_0", "outputIndexes": [ 1586 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1583, 1586 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/self_attn/Reshape_1_output_0", "outputIndexes": [ 1587 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1587 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 143633868, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.16/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1589 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1589, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_2_output_0", "outputIndexes": [ 1590 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1589 ] , "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_3_output_0", "outputIndexes": [ 1591 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1591 ] , "main_type": "NONE", "name": "Shape2551", "outputIndexes": [ 1592 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1591 ] , "main_type": "NONE", "name": "Rank2553", "outputIndexes": [ 1593 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1593, 1593 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2555", "outputIndexes": [ 1594 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1594 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2556", "outputIndexes": [ 1595 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1594, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2558", "outputIndexes": [ 1596 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1596 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2559", "outputIndexes": [ 1597 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1592, 1595, 1597, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2562", "outputIndexes": [ 1598 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1598 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2563", "outputIndexes": [ 1599 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1599 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2564", "outputIndexes": [ 1600 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1600, 1599 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2565", "outputIndexes": [ 1601 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1591, 1601, 1594 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_3_output_0", "outputIndexes": [ 1602 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1602, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Div_1_output_0", "outputIndexes": [ 1603 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1603, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1604 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1589, 1604, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_3_output_0", "outputIndexes": [ 1605 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1605 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.16/self_attn/Neg_1_output_0", "outputIndexes": [ 1606 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1603, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1607 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1589, 20, 1607, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_2_output_0", "outputIndexes": [ 1608 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1606, 1608 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.16/self_attn/Concat_4_output_0", "outputIndexes": [ 1609 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1609, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_3_output_0", "outputIndexes": [ 1610 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1590, 1610 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Add_1_output_0", "outputIndexes": [ 1611 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3102 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 143634892, 524310, 65536, 0, 0 ] } , "name": "/layers.16/self_attn/v_proj/Linear", "outputIndexes": [ 3111 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3111 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3112 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3112 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1612 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1547, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1613 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1555, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1614 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1613, 1614, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.16/self_attn/Concat_2_output_0", "outputIndexes": [ 1615 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1612, 1615 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/self_attn/Reshape_2_output_0", "outputIndexes": [ 1616 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1582, 1611, 1616, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.16/self_attn/FusedAttention", "outputIndexes": [ 1617 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1617 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3113 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3113 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3114 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3114 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 144224738, 1048598, 131072, 0, 0 ] } , "name": "/layers.16/self_attn/o_proj/Linear", "outputIndexes": [ 3115 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3115 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3116 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3116 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1618 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1534, 1618 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/Add_output_0", "outputIndexes": [ 1619 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1619 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 145404408, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.16/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1620 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1620 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3117 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3117 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3118 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3118 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 145412600, 1572886, 196608, 0, 0 ] } , "name": "/layers.16/mlp/gate_proj/Linear", "outputIndexes": [ 3119 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3119 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3120 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3120 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1621 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1621 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.16/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1622 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3118 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 147182094, 1572886, 196608, 0, 0 ] } , "name": "/layers.16/mlp/up_proj/Linear", "outputIndexes": [ 3123 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3123 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3124 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3124 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1623 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1622, 1623 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/mlp/Mul_output_0", "outputIndexes": [ 1624 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1624 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3125 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3125 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3126 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3126 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 148951588, 1572886, 196608, 0, 0 ] } , "name": "/layers.16/mlp/down_proj/Linear", "outputIndexes": [ 3127 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3127 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3128 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3128 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1625 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1619, 1625 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/Add_1_output_0", "outputIndexes": [ 1626 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1626, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/Reshape_output_0", "outputIndexes": [ 1627 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1627 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 150721082, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.17/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1628 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1628 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3129 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3129 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3130 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3130 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 150729274, 1048598, 131072, 0, 0 ] } , "name": "/layers.17/self_attn/q_proj/Linear", "outputIndexes": [ 3131 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3131 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3132 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3132 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1629 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1628 ] , "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_output_0", "outputIndexes": [ 1630 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1630 ] , "main_type": "NONE", "name": "Shape2612", "outputIndexes": [ 1631 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1630 ] , "main_type": "NONE", "name": "Rank2614", "outputIndexes": [ 1632 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1632, 1632 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2616", "outputIndexes": [ 1633 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1633 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2617", "outputIndexes": [ 1634 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1633, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2619", "outputIndexes": [ 1635 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1635 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2620", "outputIndexes": [ 1636 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1631, 1634, 1636, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2623", "outputIndexes": [ 1637 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1637 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2624", "outputIndexes": [ 1638 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1638, 1638 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2626", "outputIndexes": [ 1639 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1630, 1639, 1633 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_output_0", "outputIndexes": [ 1640 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1640, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1641 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1633 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2634", "outputIndexes": [ 1642 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1635 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2637", "outputIndexes": [ 1643 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1631, 1642, 1643, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2640", "outputIndexes": [ 1644 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1644 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2641", "outputIndexes": [ 1645 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1645 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2642", "outputIndexes": [ 1646 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1646, 1645 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2643", "outputIndexes": [ 1647 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1630, 1647, 1633 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_1_output_0", "outputIndexes": [ 1648 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1649 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1641, 1649, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.17/self_attn/Concat_output_0", "outputIndexes": [ 1650 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1629, 1650 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/self_attn/Reshape_output_0", "outputIndexes": [ 1651 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1651 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 151908944, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.17/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1653 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_output_0", "outputIndexes": [ 1654 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653 ] , "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_2_output_0", "outputIndexes": [ 1655 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1655 ] , "main_type": "NONE", "name": "Shape2658", "outputIndexes": [ 1656 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1655 ] , "main_type": "NONE", "name": "Rank2660", "outputIndexes": [ 1657 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1657, 1657 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2662", "outputIndexes": [ 1658 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1658 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2663", "outputIndexes": [ 1659 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1658, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2665", "outputIndexes": [ 1660 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1660 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2666", "outputIndexes": [ 1661 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1656, 1659, 1661, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2669", "outputIndexes": [ 1662 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1662 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2670", "outputIndexes": [ 1663 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1663 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2671", "outputIndexes": [ 1664 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1664, 1663 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2672", "outputIndexes": [ 1665 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1655, 1665, 1658 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_2_output_0", "outputIndexes": [ 1666 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1666, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Div_output_0", "outputIndexes": [ 1667 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1667, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1668 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653, 1668, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_1_output_0", "outputIndexes": [ 1669 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1669 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.17/self_attn/Neg_output_0", "outputIndexes": [ 1670 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1667, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1671 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653, 20, 1671, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_output_0", "outputIndexes": [ 1672 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1670, 1672 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.17/self_attn/Concat_3_output_0", "outputIndexes": [ 1673 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1673, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_1_output_0", "outputIndexes": [ 1674 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1654, 1674 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Add_output_0", "outputIndexes": [ 1675 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3130 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 151909968, 524310, 65536, 0, 0 ] } , "name": "/layers.17/self_attn/k_proj/Linear", "outputIndexes": [ 3135 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3135 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3136 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3136 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1676 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1640, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1677 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1678 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1677, 1678, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.17/self_attn/Concat_1_output_0", "outputIndexes": [ 1679 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1676, 1679 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/self_attn/Reshape_1_output_0", "outputIndexes": [ 1680 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1680 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 152499814, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.17/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1682 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1682, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_2_output_0", "outputIndexes": [ 1683 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1682 ] , "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_3_output_0", "outputIndexes": [ 1684 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1684 ] , "main_type": "NONE", "name": "Shape2700", "outputIndexes": [ 1685 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1684 ] , "main_type": "NONE", "name": "Rank2702", "outputIndexes": [ 1686 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1686, 1686 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2704", "outputIndexes": [ 1687 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1687 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2705", "outputIndexes": [ 1688 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1687, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2707", "outputIndexes": [ 1689 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1689 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2708", "outputIndexes": [ 1690 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1685, 1688, 1690, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2711", "outputIndexes": [ 1691 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1691 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2712", "outputIndexes": [ 1692 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1692 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2713", "outputIndexes": [ 1693 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1693, 1692 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2714", "outputIndexes": [ 1694 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1684, 1694, 1687 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_3_output_0", "outputIndexes": [ 1695 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1695, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Div_1_output_0", "outputIndexes": [ 1696 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1696, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1697 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1682, 1697, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_3_output_0", "outputIndexes": [ 1698 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1698 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.17/self_attn/Neg_1_output_0", "outputIndexes": [ 1699 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1696, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1700 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1682, 20, 1700, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_2_output_0", "outputIndexes": [ 1701 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1699, 1701 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.17/self_attn/Concat_4_output_0", "outputIndexes": [ 1702 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1702, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_3_output_0", "outputIndexes": [ 1703 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1683, 1703 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Add_1_output_0", "outputIndexes": [ 1704 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3130 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 152500838, 524310, 65536, 0, 0 ] } , "name": "/layers.17/self_attn/v_proj/Linear", "outputIndexes": [ 3139 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3139 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3140 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3140 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1705 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1640, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1706 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1707 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1706, 1707, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.17/self_attn/Concat_2_output_0", "outputIndexes": [ 1708 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1705, 1708 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/self_attn/Reshape_2_output_0", "outputIndexes": [ 1709 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1675, 1704, 1709, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.17/self_attn/FusedAttention", "outputIndexes": [ 1710 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1710 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3141 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3141 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3142 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3142 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 153090684, 1048598, 131072, 0, 0 ] } , "name": "/layers.17/self_attn/o_proj/Linear", "outputIndexes": [ 3143 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3143 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3144 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3144 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1711 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1627, 1711 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/Add_output_0", "outputIndexes": [ 1712 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1712 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 154270354, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.17/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1713 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1713 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3145 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3145 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3146 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3146 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 154278546, 1572886, 196608, 0, 0 ] } , "name": "/layers.17/mlp/gate_proj/Linear", "outputIndexes": [ 3147 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3147 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3148 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3148 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1714 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1714 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.17/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1715 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3146 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 156048040, 1572886, 196608, 0, 0 ] } , "name": "/layers.17/mlp/up_proj/Linear", "outputIndexes": [ 3151 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3151 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3152 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3152 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1716 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1715, 1716 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/mlp/Mul_output_0", "outputIndexes": [ 1717 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1717 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3153 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3153 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3154 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3154 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 157817534, 1572886, 196608, 0, 0 ] } , "name": "/layers.17/mlp/down_proj/Linear", "outputIndexes": [ 3155 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3155 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3156 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3156 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1718 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1712, 1718 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/Add_1_output_0", "outputIndexes": [ 1719 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1719, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/Reshape_output_0", "outputIndexes": [ 1720 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1720 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 159587028, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.18/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1721 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1721 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3157 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3157 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3158 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3158 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 159595220, 1048598, 131072, 0, 0 ] } , "name": "/layers.18/self_attn/q_proj/Linear", "outputIndexes": [ 3159 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3159 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3160 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3160 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1722 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1721 ] , "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_output_0", "outputIndexes": [ 1723 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1723 ] , "main_type": "NONE", "name": "Shape2761", "outputIndexes": [ 1724 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1723 ] , "main_type": "NONE", "name": "Rank2763", "outputIndexes": [ 1725 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1725, 1725 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2765", "outputIndexes": [ 1726 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1726 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2766", "outputIndexes": [ 1727 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1726, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2768", "outputIndexes": [ 1728 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1728 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2769", "outputIndexes": [ 1729 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1724, 1727, 1729, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2772", "outputIndexes": [ 1730 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1730 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2773", "outputIndexes": [ 1731 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1731, 1731 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2775", "outputIndexes": [ 1732 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1723, 1732, 1726 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_output_0", "outputIndexes": [ 1733 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1733, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1734 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1726 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2783", "outputIndexes": [ 1735 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1728 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2786", "outputIndexes": [ 1736 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1724, 1735, 1736, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2789", "outputIndexes": [ 1737 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1737 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2790", "outputIndexes": [ 1738 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1738 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2791", "outputIndexes": [ 1739 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1739, 1738 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2792", "outputIndexes": [ 1740 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1723, 1740, 1726 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_1_output_0", "outputIndexes": [ 1741 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1742 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1734, 1742, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.18/self_attn/Concat_output_0", "outputIndexes": [ 1743 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1722, 1743 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/self_attn/Reshape_output_0", "outputIndexes": [ 1744 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1744 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 160774890, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.18/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1746 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1746, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_output_0", "outputIndexes": [ 1747 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1746 ] , "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_2_output_0", "outputIndexes": [ 1748 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1748 ] , "main_type": "NONE", "name": "Shape2807", "outputIndexes": [ 1749 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1748 ] , "main_type": "NONE", "name": "Rank2809", "outputIndexes": [ 1750 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1750, 1750 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2811", "outputIndexes": [ 1751 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1751 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2812", "outputIndexes": [ 1752 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1751, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2814", "outputIndexes": [ 1753 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1753 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2815", "outputIndexes": [ 1754 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1749, 1752, 1754, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2818", "outputIndexes": [ 1755 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1755 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2819", "outputIndexes": [ 1756 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1756 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2820", "outputIndexes": [ 1757 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1757, 1756 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2821", "outputIndexes": [ 1758 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1748, 1758, 1751 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_2_output_0", "outputIndexes": [ 1759 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1759, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Div_output_0", "outputIndexes": [ 1760 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1760, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1761 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1746, 1761, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_1_output_0", "outputIndexes": [ 1762 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1762 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.18/self_attn/Neg_output_0", "outputIndexes": [ 1763 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1760, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1764 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1746, 20, 1764, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_output_0", "outputIndexes": [ 1765 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1763, 1765 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.18/self_attn/Concat_3_output_0", "outputIndexes": [ 1766 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1766, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_1_output_0", "outputIndexes": [ 1767 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1747, 1767 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Add_output_0", "outputIndexes": [ 1768 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3158 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 160775914, 524310, 65536, 0, 0 ] } , "name": "/layers.18/self_attn/k_proj/Linear", "outputIndexes": [ 3163 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3163 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3164 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3164 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1769 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1733, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1770 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1771 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1770, 1771, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.18/self_attn/Concat_1_output_0", "outputIndexes": [ 1772 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1769, 1772 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/self_attn/Reshape_1_output_0", "outputIndexes": [ 1773 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1773 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 161365760, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.18/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1775 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1775, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_2_output_0", "outputIndexes": [ 1776 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1775 ] , "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_3_output_0", "outputIndexes": [ 1777 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1777 ] , "main_type": "NONE", "name": "Shape2849", "outputIndexes": [ 1778 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1777 ] , "main_type": "NONE", "name": "Rank2851", "outputIndexes": [ 1779 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1779, 1779 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2853", "outputIndexes": [ 1780 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1780 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2854", "outputIndexes": [ 1781 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1780, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2856", "outputIndexes": [ 1782 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1782 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2857", "outputIndexes": [ 1783 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1778, 1781, 1783, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2860", "outputIndexes": [ 1784 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1784 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2861", "outputIndexes": [ 1785 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1785 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2862", "outputIndexes": [ 1786 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1786, 1785 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2863", "outputIndexes": [ 1787 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1777, 1787, 1780 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_3_output_0", "outputIndexes": [ 1788 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1788, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Div_1_output_0", "outputIndexes": [ 1789 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1789, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1790 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1775, 1790, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_3_output_0", "outputIndexes": [ 1791 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1791 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.18/self_attn/Neg_1_output_0", "outputIndexes": [ 1792 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1789, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1793 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1775, 20, 1793, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_2_output_0", "outputIndexes": [ 1794 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1792, 1794 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.18/self_attn/Concat_4_output_0", "outputIndexes": [ 1795 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1795, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_3_output_0", "outputIndexes": [ 1796 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1776, 1796 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Add_1_output_0", "outputIndexes": [ 1797 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3158 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 161366784, 524310, 65536, 0, 0 ] } , "name": "/layers.18/self_attn/v_proj/Linear", "outputIndexes": [ 3167 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3167 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3168 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3168 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1798 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1733, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1799 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1800 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1799, 1800, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.18/self_attn/Concat_2_output_0", "outputIndexes": [ 1801 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1798, 1801 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/self_attn/Reshape_2_output_0", "outputIndexes": [ 1802 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1768, 1797, 1802, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.18/self_attn/FusedAttention", "outputIndexes": [ 1803 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1803 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3169 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3169 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3170 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3170 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 161956630, 1048598, 131072, 0, 0 ] } , "name": "/layers.18/self_attn/o_proj/Linear", "outputIndexes": [ 3171 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3171 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3172 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3172 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1804 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1720, 1804 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/Add_output_0", "outputIndexes": [ 1805 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1805 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 163136300, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.18/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1806 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1806 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3173 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3173 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3174 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3174 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 163144492, 1572886, 196608, 0, 0 ] } , "name": "/layers.18/mlp/gate_proj/Linear", "outputIndexes": [ 3175 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3175 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3176 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3176 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1807 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1807 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.18/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1808 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3174 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 164913986, 1572886, 196608, 0, 0 ] } , "name": "/layers.18/mlp/up_proj/Linear", "outputIndexes": [ 3179 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3179 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3180 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3180 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1809 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1808, 1809 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/mlp/Mul_output_0", "outputIndexes": [ 1810 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1810 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3181 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3181 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3182 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3182 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 166683480, 1572886, 196608, 0, 0 ] } , "name": "/layers.18/mlp/down_proj/Linear", "outputIndexes": [ 3183 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3183 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3184 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3184 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1811 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1805, 1811 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/Add_1_output_0", "outputIndexes": [ 1812 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1812, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/Reshape_output_0", "outputIndexes": [ 1813 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1813 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 168452974, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.19/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1814 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1814 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3185 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3185 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3186 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3186 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 168461166, 1048598, 131072, 0, 0 ] } , "name": "/layers.19/self_attn/q_proj/Linear", "outputIndexes": [ 3187 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3187 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3188 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3188 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1815 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1814 ] , "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_output_0", "outputIndexes": [ 1816 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1816 ] , "main_type": "NONE", "name": "Shape2910", "outputIndexes": [ 1817 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1816 ] , "main_type": "NONE", "name": "Rank2912", "outputIndexes": [ 1818 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1818, 1818 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2914", "outputIndexes": [ 1819 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1819 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2915", "outputIndexes": [ 1820 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1819, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2917", "outputIndexes": [ 1821 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1821 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2918", "outputIndexes": [ 1822 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1817, 1820, 1822, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2921", "outputIndexes": [ 1823 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1823 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2922", "outputIndexes": [ 1824 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1824, 1824 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2924", "outputIndexes": [ 1825 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1816, 1825, 1819 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_output_0", "outputIndexes": [ 1826 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1826, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1827 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1819 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2932", "outputIndexes": [ 1828 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1821 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2935", "outputIndexes": [ 1829 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1817, 1828, 1829, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2938", "outputIndexes": [ 1830 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1830 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2939", "outputIndexes": [ 1831 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1831 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2940", "outputIndexes": [ 1832 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1832, 1831 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2941", "outputIndexes": [ 1833 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1816, 1833, 1819 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_1_output_0", "outputIndexes": [ 1834 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1835 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1827, 1835, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.19/self_attn/Concat_output_0", "outputIndexes": [ 1836 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1815, 1836 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/self_attn/Reshape_output_0", "outputIndexes": [ 1837 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1837 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 169640836, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.19/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1839 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_output_0", "outputIndexes": [ 1840 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839 ] , "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_2_output_0", "outputIndexes": [ 1841 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1841 ] , "main_type": "NONE", "name": "Shape2956", "outputIndexes": [ 1842 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1841 ] , "main_type": "NONE", "name": "Rank2958", "outputIndexes": [ 1843 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1843, 1843 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2960", "outputIndexes": [ 1844 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1844 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2961", "outputIndexes": [ 1845 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1844, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2963", "outputIndexes": [ 1846 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1846 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2964", "outputIndexes": [ 1847 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1842, 1845, 1847, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2967", "outputIndexes": [ 1848 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1848 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2968", "outputIndexes": [ 1849 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1849 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2969", "outputIndexes": [ 1850 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1850, 1849 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2970", "outputIndexes": [ 1851 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1841, 1851, 1844 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_2_output_0", "outputIndexes": [ 1852 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1852, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Div_output_0", "outputIndexes": [ 1853 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1853, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1854 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839, 1854, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_1_output_0", "outputIndexes": [ 1855 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1855 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.19/self_attn/Neg_output_0", "outputIndexes": [ 1856 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1853, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1857 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839, 20, 1857, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_output_0", "outputIndexes": [ 1858 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1856, 1858 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.19/self_attn/Concat_3_output_0", "outputIndexes": [ 1859 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1859, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_1_output_0", "outputIndexes": [ 1860 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1840, 1860 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Add_output_0", "outputIndexes": [ 1861 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3186 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 169641860, 524310, 65536, 0, 0 ] } , "name": "/layers.19/self_attn/k_proj/Linear", "outputIndexes": [ 3191 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3191 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3192 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3192 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1862 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1826, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1863 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1864 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1863, 1864, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.19/self_attn/Concat_1_output_0", "outputIndexes": [ 1865 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1862, 1865 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/self_attn/Reshape_1_output_0", "outputIndexes": [ 1866 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1866 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 170231706, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.19/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1868 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1868, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_2_output_0", "outputIndexes": [ 1869 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1868 ] , "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_3_output_0", "outputIndexes": [ 1870 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1870 ] , "main_type": "NONE", "name": "Shape2998", "outputIndexes": [ 1871 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1870 ] , "main_type": "NONE", "name": "Rank3000", "outputIndexes": [ 1872 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1872, 1872 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3002", "outputIndexes": [ 1873 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1873 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3003", "outputIndexes": [ 1874 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1873, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3005", "outputIndexes": [ 1875 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1875 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3006", "outputIndexes": [ 1876 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1871, 1874, 1876, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3009", "outputIndexes": [ 1877 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1877 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3010", "outputIndexes": [ 1878 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1878 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3011", "outputIndexes": [ 1879 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1879, 1878 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3012", "outputIndexes": [ 1880 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1870, 1880, 1873 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_3_output_0", "outputIndexes": [ 1881 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1881, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Div_1_output_0", "outputIndexes": [ 1882 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1882, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1883 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1868, 1883, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_3_output_0", "outputIndexes": [ 1884 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1884 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.19/self_attn/Neg_1_output_0", "outputIndexes": [ 1885 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1882, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1886 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1868, 20, 1886, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_2_output_0", "outputIndexes": [ 1887 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1885, 1887 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.19/self_attn/Concat_4_output_0", "outputIndexes": [ 1888 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1888, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_3_output_0", "outputIndexes": [ 1889 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1869, 1889 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Add_1_output_0", "outputIndexes": [ 1890 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3186 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 170232730, 524310, 65536, 0, 0 ] } , "name": "/layers.19/self_attn/v_proj/Linear", "outputIndexes": [ 3195 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3195 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3196 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3196 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1891 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1826, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1892 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1893 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1892, 1893, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.19/self_attn/Concat_2_output_0", "outputIndexes": [ 1894 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1891, 1894 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/self_attn/Reshape_2_output_0", "outputIndexes": [ 1895 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1861, 1890, 1895, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.19/self_attn/FusedAttention", "outputIndexes": [ 1896 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1896 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3197 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3197 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3198 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3198 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 170822576, 1048598, 131072, 0, 0 ] } , "name": "/layers.19/self_attn/o_proj/Linear", "outputIndexes": [ 3199 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3199 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3200 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3200 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1897 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1813, 1897 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/Add_output_0", "outputIndexes": [ 1898 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1898 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 172002246, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.19/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1899 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1899 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3201 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3201 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3202 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3202 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 172010438, 1572886, 196608, 0, 0 ] } , "name": "/layers.19/mlp/gate_proj/Linear", "outputIndexes": [ 3203 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3203 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3204 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3204 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1900 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1900 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.19/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1901 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3202 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 173779932, 1572886, 196608, 0, 0 ] } , "name": "/layers.19/mlp/up_proj/Linear", "outputIndexes": [ 3207 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3207 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3208 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3208 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1902 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1901, 1902 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/mlp/Mul_output_0", "outputIndexes": [ 1903 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1903 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3209 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3209 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3210 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3210 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 175549426, 1572886, 196608, 0, 0 ] } , "name": "/layers.19/mlp/down_proj/Linear", "outputIndexes": [ 3211 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3211 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3212 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3212 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1904 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1898, 1904 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/Add_1_output_0", "outputIndexes": [ 1905 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1905, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/Reshape_output_0", "outputIndexes": [ 1906 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1906 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 177318920, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.20/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1907 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1907 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3213 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3213 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3214 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3214 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 177327112, 1048598, 131072, 0, 0 ] } , "name": "/layers.20/self_attn/q_proj/Linear", "outputIndexes": [ 3215 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3215 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3216 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3216 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1908 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1907 ] , "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_output_0", "outputIndexes": [ 1909 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1909 ] , "main_type": "NONE", "name": "Shape3059", "outputIndexes": [ 1910 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1909 ] , "main_type": "NONE", "name": "Rank3061", "outputIndexes": [ 1911 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1911, 1911 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3063", "outputIndexes": [ 1912 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1912 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3064", "outputIndexes": [ 1913 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1912, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3066", "outputIndexes": [ 1914 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1914 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3067", "outputIndexes": [ 1915 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1910, 1913, 1915, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3070", "outputIndexes": [ 1916 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1916 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3071", "outputIndexes": [ 1917 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1917, 1917 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3073", "outputIndexes": [ 1918 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1909, 1918, 1912 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_output_0", "outputIndexes": [ 1919 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1919, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1920 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1912 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3081", "outputIndexes": [ 1921 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1914 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3084", "outputIndexes": [ 1922 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1910, 1921, 1922, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3087", "outputIndexes": [ 1923 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1923 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3088", "outputIndexes": [ 1924 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1924 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3089", "outputIndexes": [ 1925 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1925, 1924 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3090", "outputIndexes": [ 1926 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1909, 1926, 1912 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_1_output_0", "outputIndexes": [ 1927 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1927, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1928 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1920, 1928, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.20/self_attn/Concat_output_0", "outputIndexes": [ 1929 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1908, 1929 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/self_attn/Reshape_output_0", "outputIndexes": [ 1930 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1930 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 178506782, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.20/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 1932 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1932, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_output_0", "outputIndexes": [ 1933 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1932 ] , "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_2_output_0", "outputIndexes": [ 1934 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1934 ] , "main_type": "NONE", "name": "Shape3105", "outputIndexes": [ 1935 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1934 ] , "main_type": "NONE", "name": "Rank3107", "outputIndexes": [ 1936 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1936, 1936 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3109", "outputIndexes": [ 1937 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1937 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3110", "outputIndexes": [ 1938 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1937, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3112", "outputIndexes": [ 1939 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1939 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3113", "outputIndexes": [ 1940 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1935, 1938, 1940, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3116", "outputIndexes": [ 1941 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1941 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3117", "outputIndexes": [ 1942 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1942 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3118", "outputIndexes": [ 1943 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1943, 1942 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3119", "outputIndexes": [ 1944 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1934, 1944, 1937 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_2_output_0", "outputIndexes": [ 1945 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1945, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Div_output_0", "outputIndexes": [ 1946 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1946, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1947 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1932, 1947, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_1_output_0", "outputIndexes": [ 1948 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1948 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.20/self_attn/Neg_output_0", "outputIndexes": [ 1949 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1946, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1950 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1932, 20, 1950, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_output_0", "outputIndexes": [ 1951 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1949, 1951 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.20/self_attn/Concat_3_output_0", "outputIndexes": [ 1952 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1952, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_1_output_0", "outputIndexes": [ 1953 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1933, 1953 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Add_output_0", "outputIndexes": [ 1954 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3214 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 178507806, 524310, 65536, 0, 0 ] } , "name": "/layers.20/self_attn/k_proj/Linear", "outputIndexes": [ 3219 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3219 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3220 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3220 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1955 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1919, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1956 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1927, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1957 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1956, 1957, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.20/self_attn/Concat_1_output_0", "outputIndexes": [ 1958 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1955, 1958 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/self_attn/Reshape_1_output_0", "outputIndexes": [ 1959 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1959 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 179097652, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.20/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 1961 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1961, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_2_output_0", "outputIndexes": [ 1962 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1961 ] , "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_3_output_0", "outputIndexes": [ 1963 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1963 ] , "main_type": "NONE", "name": "Shape3147", "outputIndexes": [ 1964 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1963 ] , "main_type": "NONE", "name": "Rank3149", "outputIndexes": [ 1965 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1965, 1965 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3151", "outputIndexes": [ 1966 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3152", "outputIndexes": [ 1967 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3154", "outputIndexes": [ 1968 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1968 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3155", "outputIndexes": [ 1969 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1964, 1967, 1969, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3158", "outputIndexes": [ 1970 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1970 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3159", "outputIndexes": [ 1971 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 1971 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3160", "outputIndexes": [ 1972 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1972, 1971 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3161", "outputIndexes": [ 1973 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1963, 1973, 1966 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_3_output_0", "outputIndexes": [ 1974 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1974, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Div_1_output_0", "outputIndexes": [ 1975 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1975, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1976 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1961, 1976, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_3_output_0", "outputIndexes": [ 1977 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1977 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.20/self_attn/Neg_1_output_0", "outputIndexes": [ 1978 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1975, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1979 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1961, 20, 1979, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_2_output_0", "outputIndexes": [ 1980 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1978, 1980 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.20/self_attn/Concat_4_output_0", "outputIndexes": [ 1981 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1981, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_3_output_0", "outputIndexes": [ 1982 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1962, 1982 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Add_1_output_0", "outputIndexes": [ 1983 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3214 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 179098676, 524310, 65536, 0, 0 ] } , "name": "/layers.20/self_attn/v_proj/Linear", "outputIndexes": [ 3223 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3223 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3224 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3224 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1984 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1919, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1985 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1927, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1986 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1985, 1986, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.20/self_attn/Concat_2_output_0", "outputIndexes": [ 1987 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1984, 1987 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/self_attn/Reshape_2_output_0", "outputIndexes": [ 1988 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1954, 1983, 1988, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.20/self_attn/FusedAttention", "outputIndexes": [ 1989 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1989 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3225 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3225 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3226 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3226 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 179688522, 1048598, 131072, 0, 0 ] } , "name": "/layers.20/self_attn/o_proj/Linear", "outputIndexes": [ 3227 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3227 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3228 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3228 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1990 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1906, 1990 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/Add_output_0", "outputIndexes": [ 1991 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1991 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 180868192, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.20/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1992 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1992 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3229 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3229 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3230 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3230 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 180876384, 1572886, 196608, 0, 0 ] } , "name": "/layers.20/mlp/gate_proj/Linear", "outputIndexes": [ 3231 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3231 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3232 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3232 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1993 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1993 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.20/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1994 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3230 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 182645878, 1572886, 196608, 0, 0 ] } , "name": "/layers.20/mlp/up_proj/Linear", "outputIndexes": [ 3235 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3235 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3236 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3236 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1995 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1994, 1995 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/mlp/Mul_output_0", "outputIndexes": [ 1996 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1996 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3237 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3237 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3238 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3238 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 184415372, 1572886, 196608, 0, 0 ] } , "name": "/layers.20/mlp/down_proj/Linear", "outputIndexes": [ 3239 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3239 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3240 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3240 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1997 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1991, 1997 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/Add_1_output_0", "outputIndexes": [ 1998 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1998, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/Reshape_output_0", "outputIndexes": [ 1999 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1999 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 186184866, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.21/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2000 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2000 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3241 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3241 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3242 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3242 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 186193058, 1048598, 131072, 0, 0 ] } , "name": "/layers.21/self_attn/q_proj/Linear", "outputIndexes": [ 3243 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3243 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3244 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3244 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2001 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2000 ] , "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_output_0", "outputIndexes": [ 2002 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2002 ] , "main_type": "NONE", "name": "Shape3208", "outputIndexes": [ 2003 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2002 ] , "main_type": "NONE", "name": "Rank3210", "outputIndexes": [ 2004 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2004, 2004 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3212", "outputIndexes": [ 2005 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2005 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3213", "outputIndexes": [ 2006 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2005, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3215", "outputIndexes": [ 2007 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2007 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3216", "outputIndexes": [ 2008 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2003, 2006, 2008, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3219", "outputIndexes": [ 2009 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2009 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3220", "outputIndexes": [ 2010 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2010, 2010 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3222", "outputIndexes": [ 2011 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2002, 2011, 2005 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_output_0", "outputIndexes": [ 2012 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2012, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2013 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2005 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3230", "outputIndexes": [ 2014 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2007 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3233", "outputIndexes": [ 2015 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2003, 2014, 2015, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3236", "outputIndexes": [ 2016 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2016 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3237", "outputIndexes": [ 2017 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2017 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3238", "outputIndexes": [ 2018 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2018, 2017 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3239", "outputIndexes": [ 2019 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2002, 2019, 2005 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_1_output_0", "outputIndexes": [ 2020 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2020, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2021 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2013, 2021, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.21/self_attn/Concat_output_0", "outputIndexes": [ 2022 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2001, 2022 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/self_attn/Reshape_output_0", "outputIndexes": [ 2023 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2023 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 187372728, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.21/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2025 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2025, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_output_0", "outputIndexes": [ 2026 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2025 ] , "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_2_output_0", "outputIndexes": [ 2027 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2027 ] , "main_type": "NONE", "name": "Shape3254", "outputIndexes": [ 2028 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2027 ] , "main_type": "NONE", "name": "Rank3256", "outputIndexes": [ 2029 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2029, 2029 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3258", "outputIndexes": [ 2030 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2030 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3259", "outputIndexes": [ 2031 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2030, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3261", "outputIndexes": [ 2032 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2032 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3262", "outputIndexes": [ 2033 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2028, 2031, 2033, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3265", "outputIndexes": [ 2034 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2034 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3266", "outputIndexes": [ 2035 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2035 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3267", "outputIndexes": [ 2036 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2036, 2035 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3268", "outputIndexes": [ 2037 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2027, 2037, 2030 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_2_output_0", "outputIndexes": [ 2038 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2038, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Div_output_0", "outputIndexes": [ 2039 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2039, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2040 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2025, 2040, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_1_output_0", "outputIndexes": [ 2041 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2041 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.21/self_attn/Neg_output_0", "outputIndexes": [ 2042 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2039, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2043 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2025, 20, 2043, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_output_0", "outputIndexes": [ 2044 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2042, 2044 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.21/self_attn/Concat_3_output_0", "outputIndexes": [ 2045 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2045, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_1_output_0", "outputIndexes": [ 2046 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2026, 2046 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Add_output_0", "outputIndexes": [ 2047 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3242 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 187373752, 524310, 65536, 0, 0 ] } , "name": "/layers.21/self_attn/k_proj/Linear", "outputIndexes": [ 3247 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3247 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3248 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3248 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2048 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2012, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2049 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2020, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2050 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2049, 2050, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.21/self_attn/Concat_1_output_0", "outputIndexes": [ 2051 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2048, 2051 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/self_attn/Reshape_1_output_0", "outputIndexes": [ 2052 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2052 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 187963598, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.21/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2054 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2054, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_2_output_0", "outputIndexes": [ 2055 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2054 ] , "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_3_output_0", "outputIndexes": [ 2056 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2056 ] , "main_type": "NONE", "name": "Shape3296", "outputIndexes": [ 2057 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2056 ] , "main_type": "NONE", "name": "Rank3298", "outputIndexes": [ 2058 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2058, 2058 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3300", "outputIndexes": [ 2059 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2059 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3301", "outputIndexes": [ 2060 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2059, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3303", "outputIndexes": [ 2061 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2061 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3304", "outputIndexes": [ 2062 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2057, 2060, 2062, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3307", "outputIndexes": [ 2063 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2063 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3308", "outputIndexes": [ 2064 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2064 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3309", "outputIndexes": [ 2065 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2065, 2064 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3310", "outputIndexes": [ 2066 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2056, 2066, 2059 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_3_output_0", "outputIndexes": [ 2067 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2067, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Div_1_output_0", "outputIndexes": [ 2068 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2068, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2069 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2054, 2069, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_3_output_0", "outputIndexes": [ 2070 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2070 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.21/self_attn/Neg_1_output_0", "outputIndexes": [ 2071 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2068, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2072 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2054, 20, 2072, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_2_output_0", "outputIndexes": [ 2073 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2071, 2073 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.21/self_attn/Concat_4_output_0", "outputIndexes": [ 2074 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2074, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_3_output_0", "outputIndexes": [ 2075 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2055, 2075 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Add_1_output_0", "outputIndexes": [ 2076 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3242 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 187964622, 524310, 65536, 0, 0 ] } , "name": "/layers.21/self_attn/v_proj/Linear", "outputIndexes": [ 3251 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3251 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3252 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3252 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2077 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2012, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2078 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2020, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2079 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2078, 2079, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.21/self_attn/Concat_2_output_0", "outputIndexes": [ 2080 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2077, 2080 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/self_attn/Reshape_2_output_0", "outputIndexes": [ 2081 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2047, 2076, 2081, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.21/self_attn/FusedAttention", "outputIndexes": [ 2082 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2082 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3253 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3253 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3254 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3254 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 188554468, 1048598, 131072, 0, 0 ] } , "name": "/layers.21/self_attn/o_proj/Linear", "outputIndexes": [ 3255 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3255 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3256 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3256 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2083 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1999, 2083 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/Add_output_0", "outputIndexes": [ 2084 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2084 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 189734138, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.21/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2085 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2085 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3257 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3257 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3258 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3258 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 189742330, 1572886, 196608, 0, 0 ] } , "name": "/layers.21/mlp/gate_proj/Linear", "outputIndexes": [ 3259 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3259 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3260 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3260 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2086 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2086 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.21/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2087 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3258 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 191511824, 1572886, 196608, 0, 0 ] } , "name": "/layers.21/mlp/up_proj/Linear", "outputIndexes": [ 3263 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3263 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3264 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3264 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2088 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2087, 2088 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/mlp/Mul_output_0", "outputIndexes": [ 2089 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2089 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3265 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3265 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3266 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3266 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 193281318, 1572886, 196608, 0, 0 ] } , "name": "/layers.21/mlp/down_proj/Linear", "outputIndexes": [ 3267 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3267 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3268 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3268 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2090 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2084, 2090 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/Add_1_output_0", "outputIndexes": [ 2091 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2091, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/Reshape_output_0", "outputIndexes": [ 2092 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2092 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 195050812, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.22/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2093 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2093 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3269 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3269 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3270 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3270 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 195059004, 1048598, 131072, 0, 0 ] } , "name": "/layers.22/self_attn/q_proj/Linear", "outputIndexes": [ 3271 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3271 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3272 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3272 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2094 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2093 ] , "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_output_0", "outputIndexes": [ 2095 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2095 ] , "main_type": "NONE", "name": "Shape3357", "outputIndexes": [ 2096 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2095 ] , "main_type": "NONE", "name": "Rank3359", "outputIndexes": [ 2097 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2097, 2097 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3361", "outputIndexes": [ 2098 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2098 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3362", "outputIndexes": [ 2099 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2098, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3364", "outputIndexes": [ 2100 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2100 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3365", "outputIndexes": [ 2101 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2096, 2099, 2101, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3368", "outputIndexes": [ 2102 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2102 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3369", "outputIndexes": [ 2103 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2103, 2103 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3371", "outputIndexes": [ 2104 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2095, 2104, 2098 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_output_0", "outputIndexes": [ 2105 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2105, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2106 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2098 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3379", "outputIndexes": [ 2107 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2100 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3382", "outputIndexes": [ 2108 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2096, 2107, 2108, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3385", "outputIndexes": [ 2109 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2109 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3386", "outputIndexes": [ 2110 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2110 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3387", "outputIndexes": [ 2111 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2111, 2110 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3388", "outputIndexes": [ 2112 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2095, 2112, 2098 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_1_output_0", "outputIndexes": [ 2113 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2113, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2114 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2106, 2114, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.22/self_attn/Concat_output_0", "outputIndexes": [ 2115 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2094, 2115 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/self_attn/Reshape_output_0", "outputIndexes": [ 2116 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2116 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 196238674, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.22/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2118 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2118, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_output_0", "outputIndexes": [ 2119 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2118 ] , "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_2_output_0", "outputIndexes": [ 2120 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2120 ] , "main_type": "NONE", "name": "Shape3403", "outputIndexes": [ 2121 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2120 ] , "main_type": "NONE", "name": "Rank3405", "outputIndexes": [ 2122 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2122, 2122 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3407", "outputIndexes": [ 2123 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2123 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3408", "outputIndexes": [ 2124 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2123, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3410", "outputIndexes": [ 2125 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2125 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3411", "outputIndexes": [ 2126 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2121, 2124, 2126, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3414", "outputIndexes": [ 2127 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2127 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3415", "outputIndexes": [ 2128 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2128 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3416", "outputIndexes": [ 2129 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2129, 2128 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3417", "outputIndexes": [ 2130 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2120, 2130, 2123 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_2_output_0", "outputIndexes": [ 2131 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2131, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Div_output_0", "outputIndexes": [ 2132 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2132, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2133 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2118, 2133, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_1_output_0", "outputIndexes": [ 2134 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2134 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.22/self_attn/Neg_output_0", "outputIndexes": [ 2135 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2132, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2136 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2118, 20, 2136, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_output_0", "outputIndexes": [ 2137 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2135, 2137 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.22/self_attn/Concat_3_output_0", "outputIndexes": [ 2138 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2138, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_1_output_0", "outputIndexes": [ 2139 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2119, 2139 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Add_output_0", "outputIndexes": [ 2140 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3270 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 196239698, 524310, 65536, 0, 0 ] } , "name": "/layers.22/self_attn/k_proj/Linear", "outputIndexes": [ 3275 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3275 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3276 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3276 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2141 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2105, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2142 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2113, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2143 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2142, 2143, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.22/self_attn/Concat_1_output_0", "outputIndexes": [ 2144 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2141, 2144 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/self_attn/Reshape_1_output_0", "outputIndexes": [ 2145 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2145 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 196829544, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.22/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2147 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2147, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_2_output_0", "outputIndexes": [ 2148 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2147 ] , "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_3_output_0", "outputIndexes": [ 2149 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2149 ] , "main_type": "NONE", "name": "Shape3445", "outputIndexes": [ 2150 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2149 ] , "main_type": "NONE", "name": "Rank3447", "outputIndexes": [ 2151 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2151, 2151 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3449", "outputIndexes": [ 2152 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2152 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3450", "outputIndexes": [ 2153 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2152, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3452", "outputIndexes": [ 2154 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2154 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3453", "outputIndexes": [ 2155 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2150, 2153, 2155, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3456", "outputIndexes": [ 2156 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2156 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3457", "outputIndexes": [ 2157 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2157 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3458", "outputIndexes": [ 2158 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2158, 2157 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3459", "outputIndexes": [ 2159 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2149, 2159, 2152 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_3_output_0", "outputIndexes": [ 2160 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2160, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Div_1_output_0", "outputIndexes": [ 2161 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2161, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2162 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2147, 2162, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_3_output_0", "outputIndexes": [ 2163 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2163 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.22/self_attn/Neg_1_output_0", "outputIndexes": [ 2164 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2161, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2165 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2147, 20, 2165, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_2_output_0", "outputIndexes": [ 2166 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2164, 2166 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.22/self_attn/Concat_4_output_0", "outputIndexes": [ 2167 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2167, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_3_output_0", "outputIndexes": [ 2168 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2148, 2168 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Add_1_output_0", "outputIndexes": [ 2169 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3270 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 196830568, 524310, 65536, 0, 0 ] } , "name": "/layers.22/self_attn/v_proj/Linear", "outputIndexes": [ 3279 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3279 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3280 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3280 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2170 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2105, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2171 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2113, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2172 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2171, 2172, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.22/self_attn/Concat_2_output_0", "outputIndexes": [ 2173 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2170, 2173 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/self_attn/Reshape_2_output_0", "outputIndexes": [ 2174 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2140, 2169, 2174, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.22/self_attn/FusedAttention", "outputIndexes": [ 2175 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2175 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3281 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3281 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3282 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3282 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 197420414, 1048598, 131072, 0, 0 ] } , "name": "/layers.22/self_attn/o_proj/Linear", "outputIndexes": [ 3283 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3283 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3284 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3284 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2176 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2092, 2176 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/Add_output_0", "outputIndexes": [ 2177 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2177 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 198600084, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.22/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2178 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2178 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3285 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3285 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3286 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3286 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 198608276, 1572886, 196608, 0, 0 ] } , "name": "/layers.22/mlp/gate_proj/Linear", "outputIndexes": [ 3287 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3287 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3288 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3288 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2179 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2179 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.22/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2180 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3286 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 200377770, 1572886, 196608, 0, 0 ] } , "name": "/layers.22/mlp/up_proj/Linear", "outputIndexes": [ 3291 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3291 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3292 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3292 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2181 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2180, 2181 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/mlp/Mul_output_0", "outputIndexes": [ 2182 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2182 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3293 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3293 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3294 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3294 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 202147264, 1572886, 196608, 0, 0 ] } , "name": "/layers.22/mlp/down_proj/Linear", "outputIndexes": [ 3295 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3295 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3296 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3296 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2183 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2177, 2183 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/Add_1_output_0", "outputIndexes": [ 2184 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2184, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/Reshape_output_0", "outputIndexes": [ 2185 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2185 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 203916758, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.23/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2186 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2186 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3297 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3297 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3298 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3298 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 203924950, 1048598, 131072, 0, 0 ] } , "name": "/layers.23/self_attn/q_proj/Linear", "outputIndexes": [ 3299 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3299 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3300 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3300 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2187 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2186 ] , "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_output_0", "outputIndexes": [ 2188 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2188 ] , "main_type": "NONE", "name": "Shape3506", "outputIndexes": [ 2189 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2188 ] , "main_type": "NONE", "name": "Rank3508", "outputIndexes": [ 2190 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2190, 2190 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3510", "outputIndexes": [ 2191 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2191 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3511", "outputIndexes": [ 2192 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2191, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3513", "outputIndexes": [ 2193 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2193 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3514", "outputIndexes": [ 2194 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2189, 2192, 2194, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3517", "outputIndexes": [ 2195 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2195 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3518", "outputIndexes": [ 2196 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2196, 2196 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3520", "outputIndexes": [ 2197 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2188, 2197, 2191 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_output_0", "outputIndexes": [ 2198 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2198, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2199 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2191 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3528", "outputIndexes": [ 2200 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2193 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3531", "outputIndexes": [ 2201 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2189, 2200, 2201, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3534", "outputIndexes": [ 2202 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2202 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3535", "outputIndexes": [ 2203 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2203 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3536", "outputIndexes": [ 2204 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2204, 2203 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3537", "outputIndexes": [ 2205 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2188, 2205, 2191 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_1_output_0", "outputIndexes": [ 2206 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2206, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2207 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2199, 2207, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.23/self_attn/Concat_output_0", "outputIndexes": [ 2208 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2187, 2208 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/self_attn/Reshape_output_0", "outputIndexes": [ 2209 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2209 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 205104620, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.23/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2211 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2211, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_output_0", "outputIndexes": [ 2212 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2211 ] , "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_2_output_0", "outputIndexes": [ 2213 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2213 ] , "main_type": "NONE", "name": "Shape3552", "outputIndexes": [ 2214 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2213 ] , "main_type": "NONE", "name": "Rank3554", "outputIndexes": [ 2215 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2215, 2215 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3556", "outputIndexes": [ 2216 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2216 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3557", "outputIndexes": [ 2217 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2216, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3559", "outputIndexes": [ 2218 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2218 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3560", "outputIndexes": [ 2219 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2214, 2217, 2219, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3563", "outputIndexes": [ 2220 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2220 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3564", "outputIndexes": [ 2221 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2221 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3565", "outputIndexes": [ 2222 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2222, 2221 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3566", "outputIndexes": [ 2223 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2213, 2223, 2216 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_2_output_0", "outputIndexes": [ 2224 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2224, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Div_output_0", "outputIndexes": [ 2225 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2225, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2226 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2211, 2226, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_1_output_0", "outputIndexes": [ 2227 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2227 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.23/self_attn/Neg_output_0", "outputIndexes": [ 2228 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2225, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2229 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2211, 20, 2229, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_output_0", "outputIndexes": [ 2230 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2228, 2230 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.23/self_attn/Concat_3_output_0", "outputIndexes": [ 2231 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2231, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_1_output_0", "outputIndexes": [ 2232 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2212, 2232 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Add_output_0", "outputIndexes": [ 2233 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3298 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 205105644, 524310, 65536, 0, 0 ] } , "name": "/layers.23/self_attn/k_proj/Linear", "outputIndexes": [ 3303 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3303 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3304 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3304 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2234 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2198, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2235 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2206, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2236 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2235, 2236, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.23/self_attn/Concat_1_output_0", "outputIndexes": [ 2237 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2234, 2237 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/self_attn/Reshape_1_output_0", "outputIndexes": [ 2238 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2238 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 205695490, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.23/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2240 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2240, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_2_output_0", "outputIndexes": [ 2241 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2240 ] , "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_3_output_0", "outputIndexes": [ 2242 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2242 ] , "main_type": "NONE", "name": "Shape3594", "outputIndexes": [ 2243 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2242 ] , "main_type": "NONE", "name": "Rank3596", "outputIndexes": [ 2244 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2244, 2244 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3598", "outputIndexes": [ 2245 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2245 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3599", "outputIndexes": [ 2246 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2245, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3601", "outputIndexes": [ 2247 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2247 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3602", "outputIndexes": [ 2248 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2243, 2246, 2248, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3605", "outputIndexes": [ 2249 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2249 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3606", "outputIndexes": [ 2250 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2250 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3607", "outputIndexes": [ 2251 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2251, 2250 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3608", "outputIndexes": [ 2252 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2242, 2252, 2245 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_3_output_0", "outputIndexes": [ 2253 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2253, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Div_1_output_0", "outputIndexes": [ 2254 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2254, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2255 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2240, 2255, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_3_output_0", "outputIndexes": [ 2256 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2256 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.23/self_attn/Neg_1_output_0", "outputIndexes": [ 2257 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2254, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2258 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2240, 20, 2258, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_2_output_0", "outputIndexes": [ 2259 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2257, 2259 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.23/self_attn/Concat_4_output_0", "outputIndexes": [ 2260 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2260, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_3_output_0", "outputIndexes": [ 2261 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2241, 2261 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Add_1_output_0", "outputIndexes": [ 2262 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3298 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 205696514, 524310, 65536, 0, 0 ] } , "name": "/layers.23/self_attn/v_proj/Linear", "outputIndexes": [ 3307 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3307 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3308 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3308 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2263 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2198, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2264 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2206, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2265 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2264, 2265, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.23/self_attn/Concat_2_output_0", "outputIndexes": [ 2266 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2263, 2266 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/self_attn/Reshape_2_output_0", "outputIndexes": [ 2267 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2233, 2262, 2267, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.23/self_attn/FusedAttention", "outputIndexes": [ 2268 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2268 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3309 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3309 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3310 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3310 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 206286360, 1048598, 131072, 0, 0 ] } , "name": "/layers.23/self_attn/o_proj/Linear", "outputIndexes": [ 3311 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3311 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3312 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3312 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2269 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2185, 2269 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/Add_output_0", "outputIndexes": [ 2270 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2270 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 207466030, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.23/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2271 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2271 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3313 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3313 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3314 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3314 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 207474222, 1572886, 196608, 0, 0 ] } , "name": "/layers.23/mlp/gate_proj/Linear", "outputIndexes": [ 3315 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3315 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3316 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3316 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2272 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2272 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.23/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2273 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3314 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 209243716, 1572886, 196608, 0, 0 ] } , "name": "/layers.23/mlp/up_proj/Linear", "outputIndexes": [ 3319 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3319 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3320 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3320 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2274 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2273, 2274 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/mlp/Mul_output_0", "outputIndexes": [ 2275 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2275 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3321 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3321 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3322 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3322 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 211013210, 1572886, 196608, 0, 0 ] } , "name": "/layers.23/mlp/down_proj/Linear", "outputIndexes": [ 3323 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3323 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3324 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3324 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2276 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2270, 2276 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/Add_1_output_0", "outputIndexes": [ 2277 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2277, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/Reshape_output_0", "outputIndexes": [ 2278 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2278 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 212782704, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.24/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2279 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2279 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3325 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3325 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3326 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3326 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 212790896, 1048598, 131072, 0, 0 ] } , "name": "/layers.24/self_attn/q_proj/Linear", "outputIndexes": [ 3327 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3327 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3328 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3328 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2280 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2279 ] , "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_output_0", "outputIndexes": [ 2281 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2281 ] , "main_type": "NONE", "name": "Shape3655", "outputIndexes": [ 2282 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2281 ] , "main_type": "NONE", "name": "Rank3657", "outputIndexes": [ 2283 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2283, 2283 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3659", "outputIndexes": [ 2284 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2284 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3660", "outputIndexes": [ 2285 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2284, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3662", "outputIndexes": [ 2286 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2286 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3663", "outputIndexes": [ 2287 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2282, 2285, 2287, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3666", "outputIndexes": [ 2288 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2288 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3667", "outputIndexes": [ 2289 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2289, 2289 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3669", "outputIndexes": [ 2290 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2281, 2290, 2284 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_output_0", "outputIndexes": [ 2291 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2291, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2292 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2284 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3677", "outputIndexes": [ 2293 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2286 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3680", "outputIndexes": [ 2294 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2282, 2293, 2294, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3683", "outputIndexes": [ 2295 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2295 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3684", "outputIndexes": [ 2296 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2296 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3685", "outputIndexes": [ 2297 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2297, 2296 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3686", "outputIndexes": [ 2298 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2281, 2298, 2284 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_1_output_0", "outputIndexes": [ 2299 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2299, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2300 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2292, 2300, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.24/self_attn/Concat_output_0", "outputIndexes": [ 2301 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2280, 2301 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/self_attn/Reshape_output_0", "outputIndexes": [ 2302 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2302 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 213970566, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.24/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2304 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2304, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_output_0", "outputIndexes": [ 2305 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2304 ] , "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_2_output_0", "outputIndexes": [ 2306 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2306 ] , "main_type": "NONE", "name": "Shape3701", "outputIndexes": [ 2307 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2306 ] , "main_type": "NONE", "name": "Rank3703", "outputIndexes": [ 2308 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2308, 2308 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3705", "outputIndexes": [ 2309 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2309 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3706", "outputIndexes": [ 2310 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2309, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3708", "outputIndexes": [ 2311 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2311 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3709", "outputIndexes": [ 2312 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2307, 2310, 2312, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3712", "outputIndexes": [ 2313 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2313 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3713", "outputIndexes": [ 2314 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2314 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3714", "outputIndexes": [ 2315 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2315, 2314 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3715", "outputIndexes": [ 2316 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2306, 2316, 2309 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_2_output_0", "outputIndexes": [ 2317 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2317, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Div_output_0", "outputIndexes": [ 2318 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2318, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2319 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2304, 2319, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_1_output_0", "outputIndexes": [ 2320 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2320 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.24/self_attn/Neg_output_0", "outputIndexes": [ 2321 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2318, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2322 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2304, 20, 2322, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_output_0", "outputIndexes": [ 2323 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2321, 2323 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.24/self_attn/Concat_3_output_0", "outputIndexes": [ 2324 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2324, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_1_output_0", "outputIndexes": [ 2325 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2305, 2325 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Add_output_0", "outputIndexes": [ 2326 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3326 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 213971590, 524310, 65536, 0, 0 ] } , "name": "/layers.24/self_attn/k_proj/Linear", "outputIndexes": [ 3331 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3331 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3332 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3332 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2327 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2291, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2328 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2299, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2329 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2328, 2329, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.24/self_attn/Concat_1_output_0", "outputIndexes": [ 2330 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2327, 2330 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/self_attn/Reshape_1_output_0", "outputIndexes": [ 2331 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2331 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 214561436, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.24/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2333 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2333, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_2_output_0", "outputIndexes": [ 2334 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2333 ] , "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_3_output_0", "outputIndexes": [ 2335 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2335 ] , "main_type": "NONE", "name": "Shape3743", "outputIndexes": [ 2336 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2335 ] , "main_type": "NONE", "name": "Rank3745", "outputIndexes": [ 2337 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2337, 2337 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3747", "outputIndexes": [ 2338 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2338 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3748", "outputIndexes": [ 2339 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2338, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3750", "outputIndexes": [ 2340 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2340 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3751", "outputIndexes": [ 2341 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2336, 2339, 2341, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3754", "outputIndexes": [ 2342 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2342 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3755", "outputIndexes": [ 2343 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2343 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3756", "outputIndexes": [ 2344 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2344, 2343 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3757", "outputIndexes": [ 2345 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2335, 2345, 2338 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_3_output_0", "outputIndexes": [ 2346 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2346, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Div_1_output_0", "outputIndexes": [ 2347 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2347, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2348 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2333, 2348, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_3_output_0", "outputIndexes": [ 2349 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2349 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.24/self_attn/Neg_1_output_0", "outputIndexes": [ 2350 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2347, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2351 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2333, 20, 2351, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_2_output_0", "outputIndexes": [ 2352 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2350, 2352 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.24/self_attn/Concat_4_output_0", "outputIndexes": [ 2353 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2353, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_3_output_0", "outputIndexes": [ 2354 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2334, 2354 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Add_1_output_0", "outputIndexes": [ 2355 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3326 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 214562460, 524310, 65536, 0, 0 ] } , "name": "/layers.24/self_attn/v_proj/Linear", "outputIndexes": [ 3335 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3335 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3336 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3336 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2356 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2291, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2357 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2299, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2358 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2357, 2358, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.24/self_attn/Concat_2_output_0", "outputIndexes": [ 2359 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2356, 2359 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/self_attn/Reshape_2_output_0", "outputIndexes": [ 2360 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2326, 2355, 2360, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.24/self_attn/FusedAttention", "outputIndexes": [ 2361 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2361 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3337 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3337 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3338 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3338 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 215152306, 1048598, 131072, 0, 0 ] } , "name": "/layers.24/self_attn/o_proj/Linear", "outputIndexes": [ 3339 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3339 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3340 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3340 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2362 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2278, 2362 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/Add_output_0", "outputIndexes": [ 2363 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2363 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 216331976, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.24/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2364 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2364 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3341 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3341 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3342 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3342 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 216340168, 1572886, 196608, 0, 0 ] } , "name": "/layers.24/mlp/gate_proj/Linear", "outputIndexes": [ 3343 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3343 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3344 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3344 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2365 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2365 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.24/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2366 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3342 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 218109662, 1572886, 196608, 0, 0 ] } , "name": "/layers.24/mlp/up_proj/Linear", "outputIndexes": [ 3347 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3347 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3348 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3348 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2367 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2366, 2367 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/mlp/Mul_output_0", "outputIndexes": [ 2368 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2368 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3349 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3349 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3350 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3350 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 219879156, 1572886, 196608, 0, 0 ] } , "name": "/layers.24/mlp/down_proj/Linear", "outputIndexes": [ 3351 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3351 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3352 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3352 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2369 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2363, 2369 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/Add_1_output_0", "outputIndexes": [ 2370 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2370, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/Reshape_output_0", "outputIndexes": [ 2371 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2371 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 221648650, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.25/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2372 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2372 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3353 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3353 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3354 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3354 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 221656842, 1048598, 131072, 0, 0 ] } , "name": "/layers.25/self_attn/q_proj/Linear", "outputIndexes": [ 3355 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3355 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3356 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3356 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2373 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2372 ] , "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_output_0", "outputIndexes": [ 2374 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2374 ] , "main_type": "NONE", "name": "Shape3804", "outputIndexes": [ 2375 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2374 ] , "main_type": "NONE", "name": "Rank3806", "outputIndexes": [ 2376 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2376, 2376 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3808", "outputIndexes": [ 2377 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2377 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3809", "outputIndexes": [ 2378 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2377, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3811", "outputIndexes": [ 2379 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2379 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3812", "outputIndexes": [ 2380 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2375, 2378, 2380, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3815", "outputIndexes": [ 2381 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2381 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3816", "outputIndexes": [ 2382 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2382, 2382 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3818", "outputIndexes": [ 2383 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2374, 2383, 2377 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_output_0", "outputIndexes": [ 2384 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2384, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2385 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2377 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3826", "outputIndexes": [ 2386 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2379 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3829", "outputIndexes": [ 2387 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2375, 2386, 2387, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3832", "outputIndexes": [ 2388 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2388 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3833", "outputIndexes": [ 2389 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2389 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3834", "outputIndexes": [ 2390 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2390, 2389 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3835", "outputIndexes": [ 2391 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2374, 2391, 2377 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_1_output_0", "outputIndexes": [ 2392 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2392, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2393 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2385, 2393, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.25/self_attn/Concat_output_0", "outputIndexes": [ 2394 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2373, 2394 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/self_attn/Reshape_output_0", "outputIndexes": [ 2395 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2395 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 222836512, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.25/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2397 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2397, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_output_0", "outputIndexes": [ 2398 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2397 ] , "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_2_output_0", "outputIndexes": [ 2399 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2399 ] , "main_type": "NONE", "name": "Shape3850", "outputIndexes": [ 2400 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2399 ] , "main_type": "NONE", "name": "Rank3852", "outputIndexes": [ 2401 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2401, 2401 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3854", "outputIndexes": [ 2402 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2402 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3855", "outputIndexes": [ 2403 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2402, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3857", "outputIndexes": [ 2404 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2404 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3858", "outputIndexes": [ 2405 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2400, 2403, 2405, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3861", "outputIndexes": [ 2406 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2406 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3862", "outputIndexes": [ 2407 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2407 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3863", "outputIndexes": [ 2408 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2408, 2407 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3864", "outputIndexes": [ 2409 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2399, 2409, 2402 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_2_output_0", "outputIndexes": [ 2410 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2410, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Div_output_0", "outputIndexes": [ 2411 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2411, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2412 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2397, 2412, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_1_output_0", "outputIndexes": [ 2413 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2413 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.25/self_attn/Neg_output_0", "outputIndexes": [ 2414 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2411, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2415 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2397, 20, 2415, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_output_0", "outputIndexes": [ 2416 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2414, 2416 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.25/self_attn/Concat_3_output_0", "outputIndexes": [ 2417 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2417, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_1_output_0", "outputIndexes": [ 2418 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2398, 2418 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Add_output_0", "outputIndexes": [ 2419 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3354 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 222837536, 524310, 65536, 0, 0 ] } , "name": "/layers.25/self_attn/k_proj/Linear", "outputIndexes": [ 3359 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3359 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3360 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3360 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2420 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2384, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2421 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2392, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2422 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2421, 2422, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.25/self_attn/Concat_1_output_0", "outputIndexes": [ 2423 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2420, 2423 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/self_attn/Reshape_1_output_0", "outputIndexes": [ 2424 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2424 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 223427382, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.25/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2426 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2426, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_2_output_0", "outputIndexes": [ 2427 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2426 ] , "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_3_output_0", "outputIndexes": [ 2428 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2428 ] , "main_type": "NONE", "name": "Shape3892", "outputIndexes": [ 2429 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2428 ] , "main_type": "NONE", "name": "Rank3894", "outputIndexes": [ 2430 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2430, 2430 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3896", "outputIndexes": [ 2431 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2431 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3897", "outputIndexes": [ 2432 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2431, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3899", "outputIndexes": [ 2433 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2433 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3900", "outputIndexes": [ 2434 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2429, 2432, 2434, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3903", "outputIndexes": [ 2435 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2435 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3904", "outputIndexes": [ 2436 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2436 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3905", "outputIndexes": [ 2437 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2437, 2436 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3906", "outputIndexes": [ 2438 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2428, 2438, 2431 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_3_output_0", "outputIndexes": [ 2439 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2439, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Div_1_output_0", "outputIndexes": [ 2440 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2440, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2441 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2426, 2441, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_3_output_0", "outputIndexes": [ 2442 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2442 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.25/self_attn/Neg_1_output_0", "outputIndexes": [ 2443 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2440, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2444 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2426, 20, 2444, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_2_output_0", "outputIndexes": [ 2445 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2443, 2445 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.25/self_attn/Concat_4_output_0", "outputIndexes": [ 2446 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2446, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_3_output_0", "outputIndexes": [ 2447 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2427, 2447 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Add_1_output_0", "outputIndexes": [ 2448 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3354 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 223428406, 524310, 65536, 0, 0 ] } , "name": "/layers.25/self_attn/v_proj/Linear", "outputIndexes": [ 3363 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3363 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3364 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3364 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2449 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2384, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2450 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2392, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2451 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2450, 2451, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.25/self_attn/Concat_2_output_0", "outputIndexes": [ 2452 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2449, 2452 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/self_attn/Reshape_2_output_0", "outputIndexes": [ 2453 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2419, 2448, 2453, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.25/self_attn/FusedAttention", "outputIndexes": [ 2454 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2454 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3365 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3365 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3366 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3366 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 224018252, 1048598, 131072, 0, 0 ] } , "name": "/layers.25/self_attn/o_proj/Linear", "outputIndexes": [ 3367 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3367 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3368 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3368 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2455 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2371, 2455 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/Add_output_0", "outputIndexes": [ 2456 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2456 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 225197922, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.25/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2457 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2457 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3369 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3369 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3370 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3370 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 225206114, 1572886, 196608, 0, 0 ] } , "name": "/layers.25/mlp/gate_proj/Linear", "outputIndexes": [ 3371 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3371 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3372 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3372 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2458 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2458 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.25/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2459 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3370 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 226975608, 1572886, 196608, 0, 0 ] } , "name": "/layers.25/mlp/up_proj/Linear", "outputIndexes": [ 3375 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3375 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3376 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3376 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2460 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2459, 2460 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/mlp/Mul_output_0", "outputIndexes": [ 2461 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2461 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3377 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3377 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3378 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3378 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 228745102, 1572886, 196608, 0, 0 ] } , "name": "/layers.25/mlp/down_proj/Linear", "outputIndexes": [ 3379 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3379 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3380 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3380 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2462 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2456, 2462 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/Add_1_output_0", "outputIndexes": [ 2463 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2463, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/Reshape_output_0", "outputIndexes": [ 2464 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2464 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 230514596, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.26/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2465 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2465 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3381 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3381 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3382 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3382 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 230522788, 1048598, 131072, 0, 0 ] } , "name": "/layers.26/self_attn/q_proj/Linear", "outputIndexes": [ 3383 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3383 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3384 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3384 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2466 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2465 ] , "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_output_0", "outputIndexes": [ 2467 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2467 ] , "main_type": "NONE", "name": "Shape3953", "outputIndexes": [ 2468 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2467 ] , "main_type": "NONE", "name": "Rank3955", "outputIndexes": [ 2469 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2469, 2469 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3957", "outputIndexes": [ 2470 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2470 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3958", "outputIndexes": [ 2471 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2470, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3960", "outputIndexes": [ 2472 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2472 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3961", "outputIndexes": [ 2473 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2468, 2471, 2473, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3964", "outputIndexes": [ 2474 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2474 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3965", "outputIndexes": [ 2475 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2475, 2475 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3967", "outputIndexes": [ 2476 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2467, 2476, 2470 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_output_0", "outputIndexes": [ 2477 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2477, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2478 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2470 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3975", "outputIndexes": [ 2479 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2472 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3978", "outputIndexes": [ 2480 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2468, 2479, 2480, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3981", "outputIndexes": [ 2481 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2481 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3982", "outputIndexes": [ 2482 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2482 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3983", "outputIndexes": [ 2483 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2483, 2482 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3984", "outputIndexes": [ 2484 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2467, 2484, 2470 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_1_output_0", "outputIndexes": [ 2485 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2485, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2486 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2478, 2486, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.26/self_attn/Concat_output_0", "outputIndexes": [ 2487 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2466, 2487 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/self_attn/Reshape_output_0", "outputIndexes": [ 2488 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2488 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 231702458, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.26/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2490 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2490, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_output_0", "outputIndexes": [ 2491 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2490 ] , "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_2_output_0", "outputIndexes": [ 2492 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2492 ] , "main_type": "NONE", "name": "Shape3999", "outputIndexes": [ 2493 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2492 ] , "main_type": "NONE", "name": "Rank4001", "outputIndexes": [ 2494 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2494, 2494 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4003", "outputIndexes": [ 2495 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2495 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4004", "outputIndexes": [ 2496 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2495, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4006", "outputIndexes": [ 2497 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2497 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4007", "outputIndexes": [ 2498 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2493, 2496, 2498, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4010", "outputIndexes": [ 2499 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2499 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4011", "outputIndexes": [ 2500 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2500 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4012", "outputIndexes": [ 2501 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2501, 2500 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4013", "outputIndexes": [ 2502 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2492, 2502, 2495 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_2_output_0", "outputIndexes": [ 2503 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2503, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Div_output_0", "outputIndexes": [ 2504 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2504, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2505 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2490, 2505, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_1_output_0", "outputIndexes": [ 2506 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2506 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.26/self_attn/Neg_output_0", "outputIndexes": [ 2507 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2504, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2508 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2490, 20, 2508, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_output_0", "outputIndexes": [ 2509 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2507, 2509 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.26/self_attn/Concat_3_output_0", "outputIndexes": [ 2510 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2510, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_1_output_0", "outputIndexes": [ 2511 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2491, 2511 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Add_output_0", "outputIndexes": [ 2512 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3382 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 231703482, 524310, 65536, 0, 0 ] } , "name": "/layers.26/self_attn/k_proj/Linear", "outputIndexes": [ 3387 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3387 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3388 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3388 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2513 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2477, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2514 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2485, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2515 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2514, 2515, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.26/self_attn/Concat_1_output_0", "outputIndexes": [ 2516 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2513, 2516 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/self_attn/Reshape_1_output_0", "outputIndexes": [ 2517 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2517 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 232293328, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.26/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2519 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2519, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_2_output_0", "outputIndexes": [ 2520 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2519 ] , "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_3_output_0", "outputIndexes": [ 2521 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2521 ] , "main_type": "NONE", "name": "Shape4041", "outputIndexes": [ 2522 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2521 ] , "main_type": "NONE", "name": "Rank4043", "outputIndexes": [ 2523 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2523, 2523 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4045", "outputIndexes": [ 2524 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2524 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4046", "outputIndexes": [ 2525 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2524, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4048", "outputIndexes": [ 2526 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2526 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4049", "outputIndexes": [ 2527 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2522, 2525, 2527, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4052", "outputIndexes": [ 2528 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2528 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4053", "outputIndexes": [ 2529 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2529 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4054", "outputIndexes": [ 2530 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2530, 2529 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4055", "outputIndexes": [ 2531 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2521, 2531, 2524 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_3_output_0", "outputIndexes": [ 2532 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2532, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Div_1_output_0", "outputIndexes": [ 2533 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2533, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2534 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2519, 2534, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_3_output_0", "outputIndexes": [ 2535 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2535 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.26/self_attn/Neg_1_output_0", "outputIndexes": [ 2536 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2533, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2537 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2519, 20, 2537, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_2_output_0", "outputIndexes": [ 2538 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2536, 2538 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.26/self_attn/Concat_4_output_0", "outputIndexes": [ 2539 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2539, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_3_output_0", "outputIndexes": [ 2540 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2520, 2540 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Add_1_output_0", "outputIndexes": [ 2541 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3382 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 232294352, 524310, 65536, 0, 0 ] } , "name": "/layers.26/self_attn/v_proj/Linear", "outputIndexes": [ 3391 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3391 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3392 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3392 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2542 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2477, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2543 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2485, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2544 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2543, 2544, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.26/self_attn/Concat_2_output_0", "outputIndexes": [ 2545 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2542, 2545 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/self_attn/Reshape_2_output_0", "outputIndexes": [ 2546 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2512, 2541, 2546, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.26/self_attn/FusedAttention", "outputIndexes": [ 2547 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2547 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3393 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3393 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3394 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3394 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 232884198, 1048598, 131072, 0, 0 ] } , "name": "/layers.26/self_attn/o_proj/Linear", "outputIndexes": [ 3395 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3395 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3396 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3396 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2548 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2464, 2548 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/Add_output_0", "outputIndexes": [ 2549 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2549 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 234063868, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.26/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2550 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2550 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3397 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3397 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3398 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3398 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 234072060, 1572886, 196608, 0, 0 ] } , "name": "/layers.26/mlp/gate_proj/Linear", "outputIndexes": [ 3399 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3399 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3400 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3400 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2551 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2551 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.26/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2552 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3398 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 235841554, 1572886, 196608, 0, 0 ] } , "name": "/layers.26/mlp/up_proj/Linear", "outputIndexes": [ 3403 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3403 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3404 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3404 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2553 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2552, 2553 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/mlp/Mul_output_0", "outputIndexes": [ 2554 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2554 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3405 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3405 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3406 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3406 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 237611048, 1572886, 196608, 0, 0 ] } , "name": "/layers.26/mlp/down_proj/Linear", "outputIndexes": [ 3407 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3407 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3408 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3408 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2555 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2549, 2555 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/Add_1_output_0", "outputIndexes": [ 2556 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2556, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/Reshape_output_0", "outputIndexes": [ 2557 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2557 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 239380542, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.27/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2558 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2558 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3409 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3409 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3410 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3410 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2048, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 239388734, 1048598, 131072, 0, 0 ] } , "name": "/layers.27/self_attn/q_proj/Linear", "outputIndexes": [ 3411 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3411 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3412 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3412 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2048 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2559 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2558 ] , "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_output_0", "outputIndexes": [ 2560 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2560 ] , "main_type": "NONE", "name": "Shape4102", "outputIndexes": [ 2561 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2560 ] , "main_type": "NONE", "name": "Rank4104", "outputIndexes": [ 2562 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2562, 2562 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4106", "outputIndexes": [ 2563 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2563 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4107", "outputIndexes": [ 2564 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2563, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4109", "outputIndexes": [ 2565 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2565 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4110", "outputIndexes": [ 2566 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2561, 2564, 2566, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4113", "outputIndexes": [ 2567 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2567 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4114", "outputIndexes": [ 2568 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2568, 2568 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4116", "outputIndexes": [ 2569 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2560, 2569, 2563 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_output_0", "outputIndexes": [ 2570 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2570, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2571 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2563 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4124", "outputIndexes": [ 2572 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2565 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4127", "outputIndexes": [ 2573 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2561, 2572, 2573, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4130", "outputIndexes": [ 2574 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2574 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4131", "outputIndexes": [ 2575 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2575 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4132", "outputIndexes": [ 2576 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2576, 2575 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4133", "outputIndexes": [ 2577 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2560, 2577, 2563 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_1_output_0", "outputIndexes": [ 2578 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2578, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2579 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2571, 2579, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.27/self_attn/Concat_output_0", "outputIndexes": [ 2580 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2559, 2580 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/self_attn/Reshape_output_0", "outputIndexes": [ 2581 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2581 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 240568404, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.27/self_attn/q_norm/Mul_1_output_0", "outputIndexes": [ 2583 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2583, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_output_0", "outputIndexes": [ 2584 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2583 ] , "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_2_output_0", "outputIndexes": [ 2585 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2585 ] , "main_type": "NONE", "name": "Shape4148", "outputIndexes": [ 2586 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2585 ] , "main_type": "NONE", "name": "Rank4150", "outputIndexes": [ 2587 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2587, 2587 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4152", "outputIndexes": [ 2588 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2588 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4153", "outputIndexes": [ 2589 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2588, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4155", "outputIndexes": [ 2590 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2590 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4156", "outputIndexes": [ 2591 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2586, 2589, 2591, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4159", "outputIndexes": [ 2592 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2592 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4160", "outputIndexes": [ 2593 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2593 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4161", "outputIndexes": [ 2594 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2594, 2593 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4162", "outputIndexes": [ 2595 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2585, 2595, 2588 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_2_output_0", "outputIndexes": [ 2596 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2596, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Div_output_0", "outputIndexes": [ 2597 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2597, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2598 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2583, 2598, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_1_output_0", "outputIndexes": [ 2599 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2599 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.27/self_attn/Neg_output_0", "outputIndexes": [ 2600 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2597, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2601 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2583, 20, 2601, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_output_0", "outputIndexes": [ 2602 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2600, 2602 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.27/self_attn/Concat_3_output_0", "outputIndexes": [ 2603 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2603, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_1_output_0", "outputIndexes": [ 2604 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2584, 2604 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Add_output_0", "outputIndexes": [ 2605 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3410 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 240569428, 524310, 65536, 0, 0 ] } , "name": "/layers.27/self_attn/k_proj/Linear", "outputIndexes": [ 3415 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3415 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3416 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3416 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2606 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2570, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2607 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2578, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2608 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2607, 2608, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.27/self_attn/Concat_1_output_0", "outputIndexes": [ 2609 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2606, 2609 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/self_attn/Reshape_1_output_0", "outputIndexes": [ 2610 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2610 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 241159274, 512, 512 ] , "useRMSNorm": true } , "name": "/blocks.27/self_attn/k_norm/Mul_1_output_0", "outputIndexes": [ 2612 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2612, 59 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_2_output_0", "outputIndexes": [ 2613 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2612 ] , "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_3_output_0", "outputIndexes": [ 2614 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2614 ] , "main_type": "NONE", "name": "Shape4190", "outputIndexes": [ 2615 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2614 ] , "main_type": "NONE", "name": "Rank4192", "outputIndexes": [ 2616 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2616, 2616 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4194", "outputIndexes": [ 2617 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2617 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4195", "outputIndexes": [ 2618 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2617, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4197", "outputIndexes": [ 2619 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2619 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4198", "outputIndexes": [ 2620 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2615, 2618, 2620, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4201", "outputIndexes": [ 2621 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2621 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4202", "outputIndexes": [ 2622 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 2622 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4203", "outputIndexes": [ 2623 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2623, 2622 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4204", "outputIndexes": [ 2624 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2614, 2624, 2617 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_3_output_0", "outputIndexes": [ 2625 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2625, 74 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Div_1_output_0", "outputIndexes": [ 2626 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2626, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2627 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2612, 2627, 77, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_3_output_0", "outputIndexes": [ 2628 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2628 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.27/self_attn/Neg_1_output_0", "outputIndexes": [ 2629 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2626, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2630 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2612, 20, 2630, 78, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_2_output_0", "outputIndexes": [ 2631 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2629, 2631 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.27/self_attn/Concat_4_output_0", "outputIndexes": [ 2632 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2632, 90 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_3_output_0", "outputIndexes": [ 2633 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2613, 2633 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Add_1_output_0", "outputIndexes": [ 2634 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3410 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 8192, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 241160298, 524310, 65536, 0, 0 ] } , "name": "/layers.27/self_attn/v_proj/Linear", "outputIndexes": [ 3419 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3419 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3420 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3420 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2635 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2570, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2636 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2578, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2637 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2636, 2637, 96, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.27/self_attn/Concat_2_output_0", "outputIndexes": [ 2638 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2635, 2638 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/self_attn/Reshape_2_output_0", "outputIndexes": [ 2639 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2605, 2634, 2639, 128 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.27/self_attn/FusedAttention", "outputIndexes": [ 2640 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2640 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2048, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3421 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3421 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3422 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3422 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2048, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 16384, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 241750144, 1048598, 131072, 0, 0 ] } , "name": "/layers.27/self_attn/o_proj/Linear", "outputIndexes": [ 3423 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3423 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3424 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3424 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2641 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2557, 2641 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/Add_output_0", "outputIndexes": [ 2642 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2642 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 242929814, 4096, 4096 ] , "useRMSNorm": true } , "name": "/blocks.27/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2643 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2643 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3425 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3425 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3426 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3426 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 242938006, 1572886, 196608, 0, 0 ] } , "name": "/layers.27/mlp/gate_proj/Linear", "outputIndexes": [ 3427 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3427 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3428 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3428 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2644 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2644 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.27/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2645 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3426 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 3072, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 244707500, 1572886, 196608, 0, 0 ] } , "name": "/layers.27/mlp/up_proj/Linear", "outputIndexes": [ 3431 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3431 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3432 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3432 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 3072 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2646 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2645, 2646 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/mlp/Mul_output_0", "outputIndexes": [ 2647 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2647 ] , "main_type": "Reshape", "main": { "dims": [ -1, 3072, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3433 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3433 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3434 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3434 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 3072, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 24576, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 246476994, 1572886, 196608, 0, 0 ] } , "name": "/layers.27/mlp/down_proj/Linear", "outputIndexes": [ 3435 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3435 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3436 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3436 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2648 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2642, 2648 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/Add_1_output_0", "outputIndexes": [ 2649 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2649, 1, 77, 15, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_output_0", "outputIndexes": [ 2650 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2650 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 248246488, 4096, 4096 ] , "useRMSNorm": true } , "name": "hidden_states", "outputIndexes": [ 2651 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2651 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1024, 1, 1 ] , "dimType": "NCHW" } , "name": "/lm/lm_head/Linear/pre_reshape", "outputIndexes": [ 3437 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3437 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/lm/lm_head/Linear/pre_convert", "outputIndexes": [ 3438 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3438 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 151936, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1215488, "has_scaleInt": false, "shapeInt32": true, "weightSize": 0 } , "external": [ 248254680, 77791258, 9723904, 0, 0 ] } , "name": "/lm/lm_head/Linear", "outputIndexes": [ 3439 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3439 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/lm/lm_head/Linear/post_convert", "outputIndexes": [ 3440 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3440 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 151936 ] , "dimType": "NCHW" } , "name": "/lm/lm_head/Linear/post_reshape", "outputIndexes": [ 2652 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } ] , "outputName": [ "logits", "hidden_states" ] , "preferForwardType": "CPU", "sourceType": "ONNX", "tensorName": [ "position_ids", "logits_index", "input_ids", "/blocks.0/Constant_output_0", "/blocks.0/Reshape_output_0", "/blocks.0/input_layernorm/Mul_1_output_0", "/blocks.0/self_attn/q_proj/FakeLinear_output_0", "/blocks.0/self_attn/Shape_output_0", "Shape22", "Rank24", "BinaryOp26", "Unsqueeze27", "Const28", "BinaryOp29", "Unsqueeze30", "Unsqueeze32", "StridedSlice33", "Squeeze34", "BinaryOp36", "/blocks.0/self_attn/Gather_output_0", "/rotary/Constant_3_output_0", "/blocks.0/self_attn/Unsqueeze_output_0", "Unsqueeze46", "Unsqueeze49", "StridedSlice52", "Squeeze53", "BinaryOp54", "BinaryOp55", "/blocks.0/self_attn/Gather_1_output_0", "/blocks.0/self_attn/Unsqueeze_1_output_0", "/blocks.0/self_attn/Constant_2_output_0", "/blocks.0/self_attn/Constant_3_output_0", "/blocks.0/self_attn/Concat_output_0", "/blocks.0/self_attn/Reshape_output_0", "/blocks.0/self_attn/q_norm/Cast_output_0", "/blocks.0/self_attn/q_norm/Mul_1_output_0", "/rotary/Cast_output_0", "/rotary/Constant_output_0", "/rotary/Reshape_output_0", "/rotary/Constant_1_output_0", "/rotary/Mul_output_0", "/rotary/Cos_output_0", "/rotary/Unsqueeze_output_0", "/rotary/Sin_output_0", "/rotary/Unsqueeze_1_output_0", "/rotary/Concat_output_0", "/rotary/Concat_1_output_0", "/rotary/Constant_5_output_0", "/rotary/Unsqueeze_2_output_0", "/rotary/Unsqueeze_3_output_0", "Shape85", "Rank87", "BinaryOp89", "Unsqueeze90", "BinaryOp92", "Unsqueeze93", "StridedSlice96", "Squeeze97", "BinaryOp99", "/blocks.0/self_attn/Gather_2_output_0", "/blocks.0/self_attn/Mul_output_0", "/blocks.0/self_attn/Shape_2_output_0", "/blocks.0/self_attn/Constant_8_output_0", "Shape104", "Rank106", "BinaryOp108", "Unsqueeze109", "BinaryOp111", "Unsqueeze112", "StridedSlice115", "Squeeze116", "BinaryOp117", "BinaryOp118", "/blocks.0/self_attn/Gather_4_output_0", "/blocks.0/self_attn/Constant_9_output_0", "/blocks.0/self_attn/Div_output_0", "/blocks.0/self_attn/Unsqueeze_7_output_0", "/blocks.0/self_attn/Constant_16_output_0", "/blocks.0/self_attn/Constant_10_output_0", "/blocks.0/self_attn/Slice_1_output_0", "/blocks.0/self_attn/Neg_output_0", "/blocks.0/self_attn/Unsqueeze_6_output_0", "/blocks.0/self_attn/Slice_output_0", "/blocks.0/self_attn/Concat_3_output_0", "Unsqueeze136", "Unsqueeze139", "StridedSlice142", "Squeeze143", "BinaryOp144", "BinaryOp145", "/blocks.0/self_attn/Gather_3_output_0", "/blocks.0/self_attn/Mul_1_output_0", "/blocks.0/self_attn/Add_output_0", "/blocks.0/self_attn/k_proj/FakeLinear_output_0", "/blocks.0/self_attn/Unsqueeze_2_output_0", "/blocks.0/self_attn/Unsqueeze_3_output_0", "/blocks.0/self_attn/Constant_4_output_0", "/blocks.0/self_attn/Concat_1_output_0", "/blocks.0/self_attn/Reshape_1_output_0", "/blocks.0/self_attn/k_norm/Cast_output_0", "/blocks.0/self_attn/k_norm/Mul_1_output_0", "/blocks.0/self_attn/Mul_2_output_0", "/blocks.0/self_attn/Shape_3_output_0", "Shape166", "Rank168", "BinaryOp170", "Unsqueeze171", "BinaryOp173", "Unsqueeze174", "StridedSlice177", "Squeeze178", "BinaryOp179", "BinaryOp180", "/blocks.0/self_attn/Gather_5_output_0", "/blocks.0/self_attn/Div_1_output_0", "/blocks.0/self_attn/Unsqueeze_9_output_0", "/blocks.0/self_attn/Slice_3_output_0", "/blocks.0/self_attn/Neg_1_output_0", "/blocks.0/self_attn/Unsqueeze_8_output_0", "/blocks.0/self_attn/Slice_2_output_0", "/blocks.0/self_attn/Concat_4_output_0", "/blocks.0/self_attn/Mul_3_output_0", "/blocks.0/self_attn/Add_1_output_0", "/blocks.0/self_attn/v_proj/FakeLinear_output_0", "/blocks.0/self_attn/Unsqueeze_4_output_0", "/blocks.0/self_attn/Unsqueeze_5_output_0", "/blocks.0/self_attn/Concat_2_output_0", "/blocks.0/self_attn/Reshape_2_output_0", "attention_mask", "/blocks.0/self_attn/fused_attn/FusedAttention_output_0", "/blocks.0/self_attn/o_proj/FakeLinear_output_0", "/blocks.0/Add_output_0", "/blocks.0/post_attention_layernorm/Mul_1_output_0", "/blocks.0/mlp/gate_proj/FakeLinear_output_0", "/blocks.0/mlp/act_fn/Mul_output_0", "/blocks.0/mlp/up_proj/FakeLinear_output_0", "/blocks.0/mlp/Mul_output_0", "/blocks.0/mlp/down_proj/FakeLinear_output_0", "/blocks.0/Add_1_output_0", "/blocks.1/Reshape_output_0", "/blocks.1/input_layernorm/Mul_1_output_0", "/blocks.1/self_attn/q_proj/FakeLinear_output_0", "/blocks.1/self_attn/Shape_output_0", "Shape228", "Rank230", "BinaryOp232", "Unsqueeze233", "BinaryOp235", "Unsqueeze236", "StridedSlice239", "Squeeze240", "BinaryOp242", "/blocks.1/self_attn/Gather_output_0", "/blocks.1/self_attn/Unsqueeze_output_0", "Unsqueeze250", "Unsqueeze253", "StridedSlice256", "Squeeze257", "BinaryOp258", "BinaryOp259", "/blocks.1/self_attn/Gather_1_output_0", "/blocks.1/self_attn/Unsqueeze_1_output_0", "/blocks.1/self_attn/Concat_output_0", "/blocks.1/self_attn/Reshape_output_0", "/blocks.1/self_attn/q_norm/Cast_output_0", "/blocks.1/self_attn/q_norm/Mul_1_output_0", "/blocks.1/self_attn/Mul_output_0", "/blocks.1/self_attn/Shape_2_output_0", "Shape274", "Rank276", "BinaryOp278", "Unsqueeze279", "BinaryOp281", "Unsqueeze282", "StridedSlice285", "Squeeze286", "BinaryOp287", "BinaryOp288", "/blocks.1/self_attn/Gather_2_output_0", "/blocks.1/self_attn/Div_output_0", "/blocks.1/self_attn/Unsqueeze_7_output_0", "/blocks.1/self_attn/Slice_1_output_0", "/blocks.1/self_attn/Neg_output_0", "/blocks.1/self_attn/Unsqueeze_6_output_0", "/blocks.1/self_attn/Slice_output_0", "/blocks.1/self_attn/Concat_3_output_0", "/blocks.1/self_attn/Mul_1_output_0", "/blocks.1/self_attn/Add_output_0", "/blocks.1/self_attn/k_proj/FakeLinear_output_0", "/blocks.1/self_attn/Unsqueeze_2_output_0", "/blocks.1/self_attn/Unsqueeze_3_output_0", "/blocks.1/self_attn/Concat_1_output_0", "/blocks.1/self_attn/Reshape_1_output_0", "/blocks.1/self_attn/k_norm/Cast_output_0", "/blocks.1/self_attn/k_norm/Mul_1_output_0", "/blocks.1/self_attn/Mul_2_output_0", "/blocks.1/self_attn/Shape_3_output_0", "Shape316", "Rank318", "BinaryOp320", "Unsqueeze321", "BinaryOp323", "Unsqueeze324", "StridedSlice327", "Squeeze328", "BinaryOp329", "BinaryOp330", "/blocks.1/self_attn/Gather_3_output_0", "/blocks.1/self_attn/Div_1_output_0", "/blocks.1/self_attn/Unsqueeze_9_output_0", "/blocks.1/self_attn/Slice_3_output_0", "/blocks.1/self_attn/Neg_1_output_0", "/blocks.1/self_attn/Unsqueeze_8_output_0", "/blocks.1/self_attn/Slice_2_output_0", "/blocks.1/self_attn/Concat_4_output_0", "/blocks.1/self_attn/Mul_3_output_0", "/blocks.1/self_attn/Add_1_output_0", "/blocks.1/self_attn/v_proj/FakeLinear_output_0", "/blocks.1/self_attn/Unsqueeze_4_output_0", "/blocks.1/self_attn/Unsqueeze_5_output_0", "/blocks.1/self_attn/Concat_2_output_0", "/blocks.1/self_attn/Reshape_2_output_0", "/blocks.1/self_attn/fused_attn/FusedAttention_output_0", "/blocks.1/self_attn/o_proj/FakeLinear_output_0", "/blocks.1/Add_output_0", "/blocks.1/post_attention_layernorm/Mul_1_output_0", "/blocks.1/mlp/gate_proj/FakeLinear_output_0", "/blocks.1/mlp/act_fn/Mul_output_0", "/blocks.1/mlp/up_proj/FakeLinear_output_0", "/blocks.1/mlp/Mul_output_0", "/blocks.1/mlp/down_proj/FakeLinear_output_0", "/blocks.1/Add_1_output_0", "/blocks.2/Reshape_output_0", "/blocks.2/input_layernorm/Mul_1_output_0", "/blocks.2/self_attn/q_proj/FakeLinear_output_0", "/blocks.2/self_attn/Shape_output_0", "Shape377", "Rank379", "BinaryOp381", "Unsqueeze382", "BinaryOp384", "Unsqueeze385", "StridedSlice388", "Squeeze389", "BinaryOp391", "/blocks.2/self_attn/Gather_output_0", "/blocks.2/self_attn/Unsqueeze_output_0", "Unsqueeze399", "Unsqueeze402", "StridedSlice405", "Squeeze406", "BinaryOp407", "BinaryOp408", "/blocks.2/self_attn/Gather_1_output_0", "/blocks.2/self_attn/Unsqueeze_1_output_0", "/blocks.2/self_attn/Concat_output_0", "/blocks.2/self_attn/Reshape_output_0", "/blocks.2/self_attn/q_norm/Cast_output_0", "/blocks.2/self_attn/q_norm/Mul_1_output_0", "/blocks.2/self_attn/Mul_output_0", "/blocks.2/self_attn/Shape_2_output_0", "Shape423", "Rank425", "BinaryOp427", "Unsqueeze428", "BinaryOp430", "Unsqueeze431", "StridedSlice434", "Squeeze435", "BinaryOp436", "BinaryOp437", "/blocks.2/self_attn/Gather_2_output_0", "/blocks.2/self_attn/Div_output_0", "/blocks.2/self_attn/Unsqueeze_7_output_0", "/blocks.2/self_attn/Slice_1_output_0", "/blocks.2/self_attn/Neg_output_0", "/blocks.2/self_attn/Unsqueeze_6_output_0", "/blocks.2/self_attn/Slice_output_0", "/blocks.2/self_attn/Concat_3_output_0", "/blocks.2/self_attn/Mul_1_output_0", "/blocks.2/self_attn/Add_output_0", "/blocks.2/self_attn/k_proj/FakeLinear_output_0", "/blocks.2/self_attn/Unsqueeze_2_output_0", "/blocks.2/self_attn/Unsqueeze_3_output_0", "/blocks.2/self_attn/Concat_1_output_0", "/blocks.2/self_attn/Reshape_1_output_0", "/blocks.2/self_attn/k_norm/Cast_output_0", "/blocks.2/self_attn/k_norm/Mul_1_output_0", "/blocks.2/self_attn/Mul_2_output_0", "/blocks.2/self_attn/Shape_3_output_0", "Shape465", "Rank467", "BinaryOp469", "Unsqueeze470", "BinaryOp472", "Unsqueeze473", "StridedSlice476", "Squeeze477", "BinaryOp478", "BinaryOp479", "/blocks.2/self_attn/Gather_3_output_0", "/blocks.2/self_attn/Div_1_output_0", "/blocks.2/self_attn/Unsqueeze_9_output_0", "/blocks.2/self_attn/Slice_3_output_0", "/blocks.2/self_attn/Neg_1_output_0", "/blocks.2/self_attn/Unsqueeze_8_output_0", "/blocks.2/self_attn/Slice_2_output_0", "/blocks.2/self_attn/Concat_4_output_0", "/blocks.2/self_attn/Mul_3_output_0", "/blocks.2/self_attn/Add_1_output_0", "/blocks.2/self_attn/v_proj/FakeLinear_output_0", "/blocks.2/self_attn/Unsqueeze_4_output_0", "/blocks.2/self_attn/Unsqueeze_5_output_0", "/blocks.2/self_attn/Concat_2_output_0", "/blocks.2/self_attn/Reshape_2_output_0", "/blocks.2/self_attn/fused_attn/FusedAttention_output_0", "/blocks.2/self_attn/o_proj/FakeLinear_output_0", "/blocks.2/Add_output_0", "/blocks.2/post_attention_layernorm/Mul_1_output_0", "/blocks.2/mlp/gate_proj/FakeLinear_output_0", "/blocks.2/mlp/act_fn/Mul_output_0", "/blocks.2/mlp/up_proj/FakeLinear_output_0", "/blocks.2/mlp/Mul_output_0", "/blocks.2/mlp/down_proj/FakeLinear_output_0", "/blocks.2/Add_1_output_0", "/blocks.3/Reshape_output_0", "/blocks.3/input_layernorm/Mul_1_output_0", "/blocks.3/self_attn/q_proj/FakeLinear_output_0", "/blocks.3/self_attn/Shape_output_0", "Shape526", "Rank528", "BinaryOp530", "Unsqueeze531", "BinaryOp533", "Unsqueeze534", "StridedSlice537", "Squeeze538", "BinaryOp540", "/blocks.3/self_attn/Gather_output_0", "/blocks.3/self_attn/Unsqueeze_output_0", "Unsqueeze548", "Unsqueeze551", "StridedSlice554", "Squeeze555", "BinaryOp556", "BinaryOp557", "/blocks.3/self_attn/Gather_1_output_0", "/blocks.3/self_attn/Unsqueeze_1_output_0", "/blocks.3/self_attn/Concat_output_0", "/blocks.3/self_attn/Reshape_output_0", "/blocks.3/self_attn/q_norm/Cast_output_0", "/blocks.3/self_attn/q_norm/Mul_1_output_0", "/blocks.3/self_attn/Mul_output_0", "/blocks.3/self_attn/Shape_2_output_0", "Shape572", "Rank574", "BinaryOp576", "Unsqueeze577", "BinaryOp579", "Unsqueeze580", "StridedSlice583", "Squeeze584", "BinaryOp585", "BinaryOp586", "/blocks.3/self_attn/Gather_2_output_0", "/blocks.3/self_attn/Div_output_0", "/blocks.3/self_attn/Unsqueeze_7_output_0", "/blocks.3/self_attn/Slice_1_output_0", "/blocks.3/self_attn/Neg_output_0", "/blocks.3/self_attn/Unsqueeze_6_output_0", "/blocks.3/self_attn/Slice_output_0", "/blocks.3/self_attn/Concat_3_output_0", "/blocks.3/self_attn/Mul_1_output_0", "/blocks.3/self_attn/Add_output_0", "/blocks.3/self_attn/k_proj/FakeLinear_output_0", "/blocks.3/self_attn/Unsqueeze_2_output_0", "/blocks.3/self_attn/Unsqueeze_3_output_0", "/blocks.3/self_attn/Concat_1_output_0", "/blocks.3/self_attn/Reshape_1_output_0", "/blocks.3/self_attn/k_norm/Cast_output_0", "/blocks.3/self_attn/k_norm/Mul_1_output_0", "/blocks.3/self_attn/Mul_2_output_0", "/blocks.3/self_attn/Shape_3_output_0", "Shape614", "Rank616", "BinaryOp618", "Unsqueeze619", "BinaryOp621", "Unsqueeze622", "StridedSlice625", "Squeeze626", "BinaryOp627", "BinaryOp628", "/blocks.3/self_attn/Gather_3_output_0", "/blocks.3/self_attn/Div_1_output_0", "/blocks.3/self_attn/Unsqueeze_9_output_0", "/blocks.3/self_attn/Slice_3_output_0", "/blocks.3/self_attn/Neg_1_output_0", "/blocks.3/self_attn/Unsqueeze_8_output_0", "/blocks.3/self_attn/Slice_2_output_0", "/blocks.3/self_attn/Concat_4_output_0", "/blocks.3/self_attn/Mul_3_output_0", "/blocks.3/self_attn/Add_1_output_0", "/blocks.3/self_attn/v_proj/FakeLinear_output_0", "/blocks.3/self_attn/Unsqueeze_4_output_0", "/blocks.3/self_attn/Unsqueeze_5_output_0", "/blocks.3/self_attn/Concat_2_output_0", "/blocks.3/self_attn/Reshape_2_output_0", "/blocks.3/self_attn/fused_attn/FusedAttention_output_0", "/blocks.3/self_attn/o_proj/FakeLinear_output_0", "/blocks.3/Add_output_0", "/blocks.3/post_attention_layernorm/Mul_1_output_0", "/blocks.3/mlp/gate_proj/FakeLinear_output_0", "/blocks.3/mlp/act_fn/Mul_output_0", "/blocks.3/mlp/up_proj/FakeLinear_output_0", "/blocks.3/mlp/Mul_output_0", "/blocks.3/mlp/down_proj/FakeLinear_output_0", "/blocks.3/Add_1_output_0", "/blocks.4/Reshape_output_0", "/blocks.4/input_layernorm/Mul_1_output_0", "/blocks.4/self_attn/q_proj/FakeLinear_output_0", "/blocks.4/self_attn/Shape_output_0", "Shape675", "Rank677", "BinaryOp679", "Unsqueeze680", "BinaryOp682", "Unsqueeze683", "StridedSlice686", "Squeeze687", "BinaryOp689", "/blocks.4/self_attn/Gather_output_0", "/blocks.4/self_attn/Unsqueeze_output_0", "Unsqueeze697", "Unsqueeze700", "StridedSlice703", "Squeeze704", "BinaryOp705", "BinaryOp706", "/blocks.4/self_attn/Gather_1_output_0", "/blocks.4/self_attn/Unsqueeze_1_output_0", "/blocks.4/self_attn/Concat_output_0", "/blocks.4/self_attn/Reshape_output_0", "/blocks.4/self_attn/q_norm/Cast_output_0", "/blocks.4/self_attn/q_norm/Mul_1_output_0", "/blocks.4/self_attn/Mul_output_0", "/blocks.4/self_attn/Shape_2_output_0", "Shape721", "Rank723", "BinaryOp725", "Unsqueeze726", "BinaryOp728", "Unsqueeze729", "StridedSlice732", "Squeeze733", "BinaryOp734", "BinaryOp735", "/blocks.4/self_attn/Gather_2_output_0", "/blocks.4/self_attn/Div_output_0", "/blocks.4/self_attn/Unsqueeze_7_output_0", "/blocks.4/self_attn/Slice_1_output_0", "/blocks.4/self_attn/Neg_output_0", "/blocks.4/self_attn/Unsqueeze_6_output_0", "/blocks.4/self_attn/Slice_output_0", "/blocks.4/self_attn/Concat_3_output_0", "/blocks.4/self_attn/Mul_1_output_0", "/blocks.4/self_attn/Add_output_0", "/blocks.4/self_attn/k_proj/FakeLinear_output_0", "/blocks.4/self_attn/Unsqueeze_2_output_0", "/blocks.4/self_attn/Unsqueeze_3_output_0", "/blocks.4/self_attn/Concat_1_output_0", "/blocks.4/self_attn/Reshape_1_output_0", "/blocks.4/self_attn/k_norm/Cast_output_0", "/blocks.4/self_attn/k_norm/Mul_1_output_0", "/blocks.4/self_attn/Mul_2_output_0", "/blocks.4/self_attn/Shape_3_output_0", "Shape763", "Rank765", "BinaryOp767", "Unsqueeze768", "BinaryOp770", "Unsqueeze771", "StridedSlice774", "Squeeze775", "BinaryOp776", "BinaryOp777", "/blocks.4/self_attn/Gather_3_output_0", "/blocks.4/self_attn/Div_1_output_0", "/blocks.4/self_attn/Unsqueeze_9_output_0", "/blocks.4/self_attn/Slice_3_output_0", "/blocks.4/self_attn/Neg_1_output_0", "/blocks.4/self_attn/Unsqueeze_8_output_0", "/blocks.4/self_attn/Slice_2_output_0", "/blocks.4/self_attn/Concat_4_output_0", "/blocks.4/self_attn/Mul_3_output_0", "/blocks.4/self_attn/Add_1_output_0", "/blocks.4/self_attn/v_proj/FakeLinear_output_0", "/blocks.4/self_attn/Unsqueeze_4_output_0", "/blocks.4/self_attn/Unsqueeze_5_output_0", "/blocks.4/self_attn/Concat_2_output_0", "/blocks.4/self_attn/Reshape_2_output_0", "/blocks.4/self_attn/fused_attn/FusedAttention_output_0", "/blocks.4/self_attn/o_proj/FakeLinear_output_0", "/blocks.4/Add_output_0", "/blocks.4/post_attention_layernorm/Mul_1_output_0", "/blocks.4/mlp/gate_proj/FakeLinear_output_0", "/blocks.4/mlp/act_fn/Mul_output_0", "/blocks.4/mlp/up_proj/FakeLinear_output_0", "/blocks.4/mlp/Mul_output_0", "/blocks.4/mlp/down_proj/FakeLinear_output_0", "/blocks.4/Add_1_output_0", "/blocks.5/Reshape_output_0", "/blocks.5/input_layernorm/Mul_1_output_0", "/blocks.5/self_attn/q_proj/FakeLinear_output_0", "/blocks.5/self_attn/Shape_output_0", "Shape824", "Rank826", "BinaryOp828", "Unsqueeze829", "BinaryOp831", "Unsqueeze832", "StridedSlice835", "Squeeze836", "BinaryOp838", "/blocks.5/self_attn/Gather_output_0", "/blocks.5/self_attn/Unsqueeze_output_0", "Unsqueeze846", "Unsqueeze849", "StridedSlice852", "Squeeze853", "BinaryOp854", "BinaryOp855", "/blocks.5/self_attn/Gather_1_output_0", "/blocks.5/self_attn/Unsqueeze_1_output_0", "/blocks.5/self_attn/Concat_output_0", "/blocks.5/self_attn/Reshape_output_0", "/blocks.5/self_attn/q_norm/Cast_output_0", "/blocks.5/self_attn/q_norm/Mul_1_output_0", "/blocks.5/self_attn/Mul_output_0", "/blocks.5/self_attn/Shape_2_output_0", "Shape870", "Rank872", "BinaryOp874", "Unsqueeze875", "BinaryOp877", "Unsqueeze878", "StridedSlice881", "Squeeze882", "BinaryOp883", "BinaryOp884", "/blocks.5/self_attn/Gather_2_output_0", "/blocks.5/self_attn/Div_output_0", "/blocks.5/self_attn/Unsqueeze_7_output_0", "/blocks.5/self_attn/Slice_1_output_0", "/blocks.5/self_attn/Neg_output_0", "/blocks.5/self_attn/Unsqueeze_6_output_0", "/blocks.5/self_attn/Slice_output_0", "/blocks.5/self_attn/Concat_3_output_0", "/blocks.5/self_attn/Mul_1_output_0", "/blocks.5/self_attn/Add_output_0", "/blocks.5/self_attn/k_proj/FakeLinear_output_0", "/blocks.5/self_attn/Unsqueeze_2_output_0", "/blocks.5/self_attn/Unsqueeze_3_output_0", "/blocks.5/self_attn/Concat_1_output_0", "/blocks.5/self_attn/Reshape_1_output_0", "/blocks.5/self_attn/k_norm/Cast_output_0", "/blocks.5/self_attn/k_norm/Mul_1_output_0", "/blocks.5/self_attn/Mul_2_output_0", "/blocks.5/self_attn/Shape_3_output_0", "Shape912", "Rank914", "BinaryOp916", "Unsqueeze917", "BinaryOp919", "Unsqueeze920", "StridedSlice923", "Squeeze924", "BinaryOp925", "BinaryOp926", "/blocks.5/self_attn/Gather_3_output_0", "/blocks.5/self_attn/Div_1_output_0", "/blocks.5/self_attn/Unsqueeze_9_output_0", "/blocks.5/self_attn/Slice_3_output_0", "/blocks.5/self_attn/Neg_1_output_0", "/blocks.5/self_attn/Unsqueeze_8_output_0", "/blocks.5/self_attn/Slice_2_output_0", "/blocks.5/self_attn/Concat_4_output_0", "/blocks.5/self_attn/Mul_3_output_0", "/blocks.5/self_attn/Add_1_output_0", "/blocks.5/self_attn/v_proj/FakeLinear_output_0", "/blocks.5/self_attn/Unsqueeze_4_output_0", "/blocks.5/self_attn/Unsqueeze_5_output_0", "/blocks.5/self_attn/Concat_2_output_0", "/blocks.5/self_attn/Reshape_2_output_0", "/blocks.5/self_attn/fused_attn/FusedAttention_output_0", "/blocks.5/self_attn/o_proj/FakeLinear_output_0", "/blocks.5/Add_output_0", "/blocks.5/post_attention_layernorm/Mul_1_output_0", "/blocks.5/mlp/gate_proj/FakeLinear_output_0", "/blocks.5/mlp/act_fn/Mul_output_0", "/blocks.5/mlp/up_proj/FakeLinear_output_0", "/blocks.5/mlp/Mul_output_0", "/blocks.5/mlp/down_proj/FakeLinear_output_0", "/blocks.5/Add_1_output_0", "/blocks.6/Reshape_output_0", "/blocks.6/input_layernorm/Mul_1_output_0", "/blocks.6/self_attn/q_proj/FakeLinear_output_0", "/blocks.6/self_attn/Shape_output_0", "Shape973", "Rank975", "BinaryOp977", "Unsqueeze978", "BinaryOp980", "Unsqueeze981", "StridedSlice984", "Squeeze985", "BinaryOp987", "/blocks.6/self_attn/Gather_output_0", "/blocks.6/self_attn/Unsqueeze_output_0", "Unsqueeze995", "Unsqueeze998", "StridedSlice1001", "Squeeze1002", "BinaryOp1003", "BinaryOp1004", "/blocks.6/self_attn/Gather_1_output_0", "/blocks.6/self_attn/Unsqueeze_1_output_0", "/blocks.6/self_attn/Concat_output_0", "/blocks.6/self_attn/Reshape_output_0", "/blocks.6/self_attn/q_norm/Cast_output_0", "/blocks.6/self_attn/q_norm/Mul_1_output_0", "/blocks.6/self_attn/Mul_output_0", "/blocks.6/self_attn/Shape_2_output_0", "Shape1019", "Rank1021", "BinaryOp1023", "Unsqueeze1024", "BinaryOp1026", "Unsqueeze1027", "StridedSlice1030", "Squeeze1031", "BinaryOp1032", "BinaryOp1033", "/blocks.6/self_attn/Gather_2_output_0", "/blocks.6/self_attn/Div_output_0", "/blocks.6/self_attn/Unsqueeze_7_output_0", "/blocks.6/self_attn/Slice_1_output_0", "/blocks.6/self_attn/Neg_output_0", "/blocks.6/self_attn/Unsqueeze_6_output_0", "/blocks.6/self_attn/Slice_output_0", "/blocks.6/self_attn/Concat_3_output_0", "/blocks.6/self_attn/Mul_1_output_0", "/blocks.6/self_attn/Add_output_0", "/blocks.6/self_attn/k_proj/FakeLinear_output_0", "/blocks.6/self_attn/Unsqueeze_2_output_0", "/blocks.6/self_attn/Unsqueeze_3_output_0", "/blocks.6/self_attn/Concat_1_output_0", "/blocks.6/self_attn/Reshape_1_output_0", "/blocks.6/self_attn/k_norm/Cast_output_0", "/blocks.6/self_attn/k_norm/Mul_1_output_0", "/blocks.6/self_attn/Mul_2_output_0", "/blocks.6/self_attn/Shape_3_output_0", "Shape1061", "Rank1063", "BinaryOp1065", "Unsqueeze1066", "BinaryOp1068", "Unsqueeze1069", "StridedSlice1072", "Squeeze1073", "BinaryOp1074", "BinaryOp1075", "/blocks.6/self_attn/Gather_3_output_0", "/blocks.6/self_attn/Div_1_output_0", "/blocks.6/self_attn/Unsqueeze_9_output_0", "/blocks.6/self_attn/Slice_3_output_0", "/blocks.6/self_attn/Neg_1_output_0", "/blocks.6/self_attn/Unsqueeze_8_output_0", "/blocks.6/self_attn/Slice_2_output_0", "/blocks.6/self_attn/Concat_4_output_0", "/blocks.6/self_attn/Mul_3_output_0", "/blocks.6/self_attn/Add_1_output_0", "/blocks.6/self_attn/v_proj/FakeLinear_output_0", "/blocks.6/self_attn/Unsqueeze_4_output_0", "/blocks.6/self_attn/Unsqueeze_5_output_0", "/blocks.6/self_attn/Concat_2_output_0", "/blocks.6/self_attn/Reshape_2_output_0", "/blocks.6/self_attn/fused_attn/FusedAttention_output_0", "/blocks.6/self_attn/o_proj/FakeLinear_output_0", "/blocks.6/Add_output_0", "/blocks.6/post_attention_layernorm/Mul_1_output_0", "/blocks.6/mlp/gate_proj/FakeLinear_output_0", "/blocks.6/mlp/act_fn/Mul_output_0", "/blocks.6/mlp/up_proj/FakeLinear_output_0", "/blocks.6/mlp/Mul_output_0", "/blocks.6/mlp/down_proj/FakeLinear_output_0", "/blocks.6/Add_1_output_0", "/blocks.7/Reshape_output_0", "/blocks.7/input_layernorm/Mul_1_output_0", "/blocks.7/self_attn/q_proj/FakeLinear_output_0", "/blocks.7/self_attn/Shape_output_0", "Shape1122", "Rank1124", "BinaryOp1126", "Unsqueeze1127", "BinaryOp1129", "Unsqueeze1130", "StridedSlice1133", "Squeeze1134", "BinaryOp1136", "/blocks.7/self_attn/Gather_output_0", "/blocks.7/self_attn/Unsqueeze_output_0", "Unsqueeze1144", "Unsqueeze1147", "StridedSlice1150", "Squeeze1151", "BinaryOp1152", "BinaryOp1153", "/blocks.7/self_attn/Gather_1_output_0", "/blocks.7/self_attn/Unsqueeze_1_output_0", "/blocks.7/self_attn/Concat_output_0", "/blocks.7/self_attn/Reshape_output_0", "/blocks.7/self_attn/q_norm/Cast_output_0", "/blocks.7/self_attn/q_norm/Mul_1_output_0", "/blocks.7/self_attn/Mul_output_0", "/blocks.7/self_attn/Shape_2_output_0", "Shape1168", "Rank1170", "BinaryOp1172", "Unsqueeze1173", "BinaryOp1175", "Unsqueeze1176", "StridedSlice1179", "Squeeze1180", "BinaryOp1181", "BinaryOp1182", "/blocks.7/self_attn/Gather_2_output_0", "/blocks.7/self_attn/Div_output_0", "/blocks.7/self_attn/Unsqueeze_7_output_0", "/blocks.7/self_attn/Slice_1_output_0", "/blocks.7/self_attn/Neg_output_0", "/blocks.7/self_attn/Unsqueeze_6_output_0", "/blocks.7/self_attn/Slice_output_0", "/blocks.7/self_attn/Concat_3_output_0", "/blocks.7/self_attn/Mul_1_output_0", "/blocks.7/self_attn/Add_output_0", "/blocks.7/self_attn/k_proj/FakeLinear_output_0", "/blocks.7/self_attn/Unsqueeze_2_output_0", "/blocks.7/self_attn/Unsqueeze_3_output_0", "/blocks.7/self_attn/Concat_1_output_0", "/blocks.7/self_attn/Reshape_1_output_0", "/blocks.7/self_attn/k_norm/Cast_output_0", "/blocks.7/self_attn/k_norm/Mul_1_output_0", "/blocks.7/self_attn/Mul_2_output_0", "/blocks.7/self_attn/Shape_3_output_0", "Shape1210", "Rank1212", "BinaryOp1214", "Unsqueeze1215", "BinaryOp1217", "Unsqueeze1218", "StridedSlice1221", "Squeeze1222", "BinaryOp1223", "BinaryOp1224", "/blocks.7/self_attn/Gather_3_output_0", "/blocks.7/self_attn/Div_1_output_0", "/blocks.7/self_attn/Unsqueeze_9_output_0", "/blocks.7/self_attn/Slice_3_output_0", "/blocks.7/self_attn/Neg_1_output_0", "/blocks.7/self_attn/Unsqueeze_8_output_0", "/blocks.7/self_attn/Slice_2_output_0", "/blocks.7/self_attn/Concat_4_output_0", "/blocks.7/self_attn/Mul_3_output_0", "/blocks.7/self_attn/Add_1_output_0", "/blocks.7/self_attn/v_proj/FakeLinear_output_0", "/blocks.7/self_attn/Unsqueeze_4_output_0", "/blocks.7/self_attn/Unsqueeze_5_output_0", "/blocks.7/self_attn/Concat_2_output_0", "/blocks.7/self_attn/Reshape_2_output_0", "/blocks.7/self_attn/fused_attn/FusedAttention_output_0", "/blocks.7/self_attn/o_proj/FakeLinear_output_0", "/blocks.7/Add_output_0", "/blocks.7/post_attention_layernorm/Mul_1_output_0", "/blocks.7/mlp/gate_proj/FakeLinear_output_0", "/blocks.7/mlp/act_fn/Mul_output_0", "/blocks.7/mlp/up_proj/FakeLinear_output_0", "/blocks.7/mlp/Mul_output_0", "/blocks.7/mlp/down_proj/FakeLinear_output_0", "/blocks.7/Add_1_output_0", "/blocks.8/Reshape_output_0", "/blocks.8/input_layernorm/Mul_1_output_0", "/blocks.8/self_attn/q_proj/FakeLinear_output_0", "/blocks.8/self_attn/Shape_output_0", "Shape1271", "Rank1273", "BinaryOp1275", "Unsqueeze1276", "BinaryOp1278", "Unsqueeze1279", "StridedSlice1282", "Squeeze1283", "BinaryOp1285", "/blocks.8/self_attn/Gather_output_0", "/blocks.8/self_attn/Unsqueeze_output_0", "Unsqueeze1293", "Unsqueeze1296", "StridedSlice1299", "Squeeze1300", "BinaryOp1301", "BinaryOp1302", "/blocks.8/self_attn/Gather_1_output_0", "/blocks.8/self_attn/Unsqueeze_1_output_0", "/blocks.8/self_attn/Concat_output_0", "/blocks.8/self_attn/Reshape_output_0", "/blocks.8/self_attn/q_norm/Cast_output_0", "/blocks.8/self_attn/q_norm/Mul_1_output_0", "/blocks.8/self_attn/Mul_output_0", "/blocks.8/self_attn/Shape_2_output_0", "Shape1317", "Rank1319", "BinaryOp1321", "Unsqueeze1322", "BinaryOp1324", "Unsqueeze1325", "StridedSlice1328", "Squeeze1329", "BinaryOp1330", "BinaryOp1331", "/blocks.8/self_attn/Gather_2_output_0", "/blocks.8/self_attn/Div_output_0", "/blocks.8/self_attn/Unsqueeze_7_output_0", "/blocks.8/self_attn/Slice_1_output_0", "/blocks.8/self_attn/Neg_output_0", "/blocks.8/self_attn/Unsqueeze_6_output_0", "/blocks.8/self_attn/Slice_output_0", "/blocks.8/self_attn/Concat_3_output_0", "/blocks.8/self_attn/Mul_1_output_0", "/blocks.8/self_attn/Add_output_0", "/blocks.8/self_attn/k_proj/FakeLinear_output_0", "/blocks.8/self_attn/Unsqueeze_2_output_0", "/blocks.8/self_attn/Unsqueeze_3_output_0", "/blocks.8/self_attn/Concat_1_output_0", "/blocks.8/self_attn/Reshape_1_output_0", "/blocks.8/self_attn/k_norm/Cast_output_0", "/blocks.8/self_attn/k_norm/Mul_1_output_0", "/blocks.8/self_attn/Mul_2_output_0", "/blocks.8/self_attn/Shape_3_output_0", "Shape1359", "Rank1361", "BinaryOp1363", "Unsqueeze1364", "BinaryOp1366", "Unsqueeze1367", "StridedSlice1370", "Squeeze1371", "BinaryOp1372", "BinaryOp1373", "/blocks.8/self_attn/Gather_3_output_0", "/blocks.8/self_attn/Div_1_output_0", "/blocks.8/self_attn/Unsqueeze_9_output_0", "/blocks.8/self_attn/Slice_3_output_0", "/blocks.8/self_attn/Neg_1_output_0", "/blocks.8/self_attn/Unsqueeze_8_output_0", "/blocks.8/self_attn/Slice_2_output_0", "/blocks.8/self_attn/Concat_4_output_0", "/blocks.8/self_attn/Mul_3_output_0", "/blocks.8/self_attn/Add_1_output_0", "/blocks.8/self_attn/v_proj/FakeLinear_output_0", "/blocks.8/self_attn/Unsqueeze_4_output_0", "/blocks.8/self_attn/Unsqueeze_5_output_0", "/blocks.8/self_attn/Concat_2_output_0", "/blocks.8/self_attn/Reshape_2_output_0", "/blocks.8/self_attn/fused_attn/FusedAttention_output_0", "/blocks.8/self_attn/o_proj/FakeLinear_output_0", "/blocks.8/Add_output_0", "/blocks.8/post_attention_layernorm/Mul_1_output_0", "/blocks.8/mlp/gate_proj/FakeLinear_output_0", "/blocks.8/mlp/act_fn/Mul_output_0", "/blocks.8/mlp/up_proj/FakeLinear_output_0", "/blocks.8/mlp/Mul_output_0", "/blocks.8/mlp/down_proj/FakeLinear_output_0", "/blocks.8/Add_1_output_0", "/blocks.9/Reshape_output_0", "/blocks.9/input_layernorm/Mul_1_output_0", "/blocks.9/self_attn/q_proj/FakeLinear_output_0", "/blocks.9/self_attn/Shape_output_0", "Shape1420", "Rank1422", "BinaryOp1424", "Unsqueeze1425", "BinaryOp1427", "Unsqueeze1428", "StridedSlice1431", "Squeeze1432", "BinaryOp1434", "/blocks.9/self_attn/Gather_output_0", "/blocks.9/self_attn/Unsqueeze_output_0", "Unsqueeze1442", "Unsqueeze1445", "StridedSlice1448", "Squeeze1449", "BinaryOp1450", "BinaryOp1451", "/blocks.9/self_attn/Gather_1_output_0", "/blocks.9/self_attn/Unsqueeze_1_output_0", "/blocks.9/self_attn/Concat_output_0", "/blocks.9/self_attn/Reshape_output_0", "/blocks.9/self_attn/q_norm/Cast_output_0", "/blocks.9/self_attn/q_norm/Mul_1_output_0", "/blocks.9/self_attn/Mul_output_0", "/blocks.9/self_attn/Shape_2_output_0", "Shape1466", "Rank1468", "BinaryOp1470", "Unsqueeze1471", "BinaryOp1473", "Unsqueeze1474", "StridedSlice1477", "Squeeze1478", "BinaryOp1479", "BinaryOp1480", "/blocks.9/self_attn/Gather_2_output_0", "/blocks.9/self_attn/Div_output_0", "/blocks.9/self_attn/Unsqueeze_7_output_0", "/blocks.9/self_attn/Slice_1_output_0", "/blocks.9/self_attn/Neg_output_0", "/blocks.9/self_attn/Unsqueeze_6_output_0", "/blocks.9/self_attn/Slice_output_0", "/blocks.9/self_attn/Concat_3_output_0", "/blocks.9/self_attn/Mul_1_output_0", "/blocks.9/self_attn/Add_output_0", "/blocks.9/self_attn/k_proj/FakeLinear_output_0", "/blocks.9/self_attn/Unsqueeze_2_output_0", "/blocks.9/self_attn/Unsqueeze_3_output_0", "/blocks.9/self_attn/Concat_1_output_0", "/blocks.9/self_attn/Reshape_1_output_0", "/blocks.9/self_attn/k_norm/Cast_output_0", "/blocks.9/self_attn/k_norm/Mul_1_output_0", "/blocks.9/self_attn/Mul_2_output_0", "/blocks.9/self_attn/Shape_3_output_0", "Shape1508", "Rank1510", "BinaryOp1512", "Unsqueeze1513", "BinaryOp1515", "Unsqueeze1516", "StridedSlice1519", "Squeeze1520", "BinaryOp1521", "BinaryOp1522", "/blocks.9/self_attn/Gather_3_output_0", "/blocks.9/self_attn/Div_1_output_0", "/blocks.9/self_attn/Unsqueeze_9_output_0", "/blocks.9/self_attn/Slice_3_output_0", "/blocks.9/self_attn/Neg_1_output_0", "/blocks.9/self_attn/Unsqueeze_8_output_0", "/blocks.9/self_attn/Slice_2_output_0", "/blocks.9/self_attn/Concat_4_output_0", "/blocks.9/self_attn/Mul_3_output_0", "/blocks.9/self_attn/Add_1_output_0", "/blocks.9/self_attn/v_proj/FakeLinear_output_0", "/blocks.9/self_attn/Unsqueeze_4_output_0", "/blocks.9/self_attn/Unsqueeze_5_output_0", "/blocks.9/self_attn/Concat_2_output_0", "/blocks.9/self_attn/Reshape_2_output_0", "/blocks.9/self_attn/fused_attn/FusedAttention_output_0", "/blocks.9/self_attn/o_proj/FakeLinear_output_0", "/blocks.9/Add_output_0", "/blocks.9/post_attention_layernorm/Mul_1_output_0", "/blocks.9/mlp/gate_proj/FakeLinear_output_0", "/blocks.9/mlp/act_fn/Mul_output_0", "/blocks.9/mlp/up_proj/FakeLinear_output_0", "/blocks.9/mlp/Mul_output_0", "/blocks.9/mlp/down_proj/FakeLinear_output_0", "/blocks.9/Add_1_output_0", "/blocks.10/Reshape_output_0", "/blocks.10/input_layernorm/Mul_1_output_0", "/blocks.10/self_attn/q_proj/FakeLinear_output_0", "/blocks.10/self_attn/Shape_output_0", "Shape1569", "Rank1571", "BinaryOp1573", "Unsqueeze1574", "BinaryOp1576", "Unsqueeze1577", "StridedSlice1580", "Squeeze1581", "BinaryOp1583", "/blocks.10/self_attn/Gather_output_0", "/blocks.10/self_attn/Unsqueeze_output_0", "Unsqueeze1591", "Unsqueeze1594", "StridedSlice1597", "Squeeze1598", "BinaryOp1599", "BinaryOp1600", "/blocks.10/self_attn/Gather_1_output_0", "/blocks.10/self_attn/Unsqueeze_1_output_0", "/blocks.10/self_attn/Concat_output_0", "/blocks.10/self_attn/Reshape_output_0", "/blocks.10/self_attn/q_norm/Cast_output_0", "/blocks.10/self_attn/q_norm/Mul_1_output_0", "/blocks.10/self_attn/Mul_output_0", "/blocks.10/self_attn/Shape_2_output_0", "Shape1615", "Rank1617", "BinaryOp1619", "Unsqueeze1620", "BinaryOp1622", "Unsqueeze1623", "StridedSlice1626", "Squeeze1627", "BinaryOp1628", "BinaryOp1629", "/blocks.10/self_attn/Gather_2_output_0", "/blocks.10/self_attn/Div_output_0", "/blocks.10/self_attn/Unsqueeze_7_output_0", "/blocks.10/self_attn/Slice_1_output_0", "/blocks.10/self_attn/Neg_output_0", "/blocks.10/self_attn/Unsqueeze_6_output_0", "/blocks.10/self_attn/Slice_output_0", "/blocks.10/self_attn/Concat_3_output_0", "/blocks.10/self_attn/Mul_1_output_0", "/blocks.10/self_attn/Add_output_0", "/blocks.10/self_attn/k_proj/FakeLinear_output_0", "/blocks.10/self_attn/Unsqueeze_2_output_0", "/blocks.10/self_attn/Unsqueeze_3_output_0", "/blocks.10/self_attn/Concat_1_output_0", "/blocks.10/self_attn/Reshape_1_output_0", "/blocks.10/self_attn/k_norm/Cast_output_0", "/blocks.10/self_attn/k_norm/Mul_1_output_0", "/blocks.10/self_attn/Mul_2_output_0", "/blocks.10/self_attn/Shape_3_output_0", "Shape1657", "Rank1659", "BinaryOp1661", "Unsqueeze1662", "BinaryOp1664", "Unsqueeze1665", "StridedSlice1668", "Squeeze1669", "BinaryOp1670", "BinaryOp1671", "/blocks.10/self_attn/Gather_3_output_0", "/blocks.10/self_attn/Div_1_output_0", "/blocks.10/self_attn/Unsqueeze_9_output_0", "/blocks.10/self_attn/Slice_3_output_0", "/blocks.10/self_attn/Neg_1_output_0", "/blocks.10/self_attn/Unsqueeze_8_output_0", "/blocks.10/self_attn/Slice_2_output_0", "/blocks.10/self_attn/Concat_4_output_0", "/blocks.10/self_attn/Mul_3_output_0", "/blocks.10/self_attn/Add_1_output_0", "/blocks.10/self_attn/v_proj/FakeLinear_output_0", "/blocks.10/self_attn/Unsqueeze_4_output_0", "/blocks.10/self_attn/Unsqueeze_5_output_0", "/blocks.10/self_attn/Concat_2_output_0", "/blocks.10/self_attn/Reshape_2_output_0", "/blocks.10/self_attn/fused_attn/FusedAttention_output_0", "/blocks.10/self_attn/o_proj/FakeLinear_output_0", "/blocks.10/Add_output_0", "/blocks.10/post_attention_layernorm/Mul_1_output_0", "/blocks.10/mlp/gate_proj/FakeLinear_output_0", "/blocks.10/mlp/act_fn/Mul_output_0", "/blocks.10/mlp/up_proj/FakeLinear_output_0", "/blocks.10/mlp/Mul_output_0", "/blocks.10/mlp/down_proj/FakeLinear_output_0", "/blocks.10/Add_1_output_0", "/blocks.11/Reshape_output_0", "/blocks.11/input_layernorm/Mul_1_output_0", "/blocks.11/self_attn/q_proj/FakeLinear_output_0", "/blocks.11/self_attn/Shape_output_0", "Shape1718", "Rank1720", "BinaryOp1722", "Unsqueeze1723", "BinaryOp1725", "Unsqueeze1726", "StridedSlice1729", "Squeeze1730", "BinaryOp1732", "/blocks.11/self_attn/Gather_output_0", "/blocks.11/self_attn/Unsqueeze_output_0", "Unsqueeze1740", "Unsqueeze1743", "StridedSlice1746", "Squeeze1747", "BinaryOp1748", "BinaryOp1749", "/blocks.11/self_attn/Gather_1_output_0", "/blocks.11/self_attn/Unsqueeze_1_output_0", "/blocks.11/self_attn/Concat_output_0", "/blocks.11/self_attn/Reshape_output_0", "/blocks.11/self_attn/q_norm/Cast_output_0", "/blocks.11/self_attn/q_norm/Mul_1_output_0", "/blocks.11/self_attn/Mul_output_0", "/blocks.11/self_attn/Shape_2_output_0", "Shape1764", "Rank1766", "BinaryOp1768", "Unsqueeze1769", "BinaryOp1771", "Unsqueeze1772", "StridedSlice1775", "Squeeze1776", "BinaryOp1777", "BinaryOp1778", "/blocks.11/self_attn/Gather_2_output_0", "/blocks.11/self_attn/Div_output_0", "/blocks.11/self_attn/Unsqueeze_7_output_0", "/blocks.11/self_attn/Slice_1_output_0", "/blocks.11/self_attn/Neg_output_0", "/blocks.11/self_attn/Unsqueeze_6_output_0", "/blocks.11/self_attn/Slice_output_0", "/blocks.11/self_attn/Concat_3_output_0", "/blocks.11/self_attn/Mul_1_output_0", "/blocks.11/self_attn/Add_output_0", "/blocks.11/self_attn/k_proj/FakeLinear_output_0", "/blocks.11/self_attn/Unsqueeze_2_output_0", "/blocks.11/self_attn/Unsqueeze_3_output_0", "/blocks.11/self_attn/Concat_1_output_0", "/blocks.11/self_attn/Reshape_1_output_0", "/blocks.11/self_attn/k_norm/Cast_output_0", "/blocks.11/self_attn/k_norm/Mul_1_output_0", "/blocks.11/self_attn/Mul_2_output_0", "/blocks.11/self_attn/Shape_3_output_0", "Shape1806", "Rank1808", "BinaryOp1810", "Unsqueeze1811", "BinaryOp1813", "Unsqueeze1814", "StridedSlice1817", "Squeeze1818", "BinaryOp1819", "BinaryOp1820", "/blocks.11/self_attn/Gather_3_output_0", "/blocks.11/self_attn/Div_1_output_0", "/blocks.11/self_attn/Unsqueeze_9_output_0", "/blocks.11/self_attn/Slice_3_output_0", "/blocks.11/self_attn/Neg_1_output_0", "/blocks.11/self_attn/Unsqueeze_8_output_0", "/blocks.11/self_attn/Slice_2_output_0", "/blocks.11/self_attn/Concat_4_output_0", "/blocks.11/self_attn/Mul_3_output_0", "/blocks.11/self_attn/Add_1_output_0", "/blocks.11/self_attn/v_proj/FakeLinear_output_0", "/blocks.11/self_attn/Unsqueeze_4_output_0", "/blocks.11/self_attn/Unsqueeze_5_output_0", "/blocks.11/self_attn/Concat_2_output_0", "/blocks.11/self_attn/Reshape_2_output_0", "/blocks.11/self_attn/fused_attn/FusedAttention_output_0", "/blocks.11/self_attn/o_proj/FakeLinear_output_0", "/blocks.11/Add_output_0", "/blocks.11/post_attention_layernorm/Mul_1_output_0", "/blocks.11/mlp/gate_proj/FakeLinear_output_0", "/blocks.11/mlp/act_fn/Mul_output_0", "/blocks.11/mlp/up_proj/FakeLinear_output_0", "/blocks.11/mlp/Mul_output_0", "/blocks.11/mlp/down_proj/FakeLinear_output_0", "/blocks.11/Add_1_output_0", "/blocks.12/Reshape_output_0", "/blocks.12/input_layernorm/Mul_1_output_0", "/blocks.12/self_attn/q_proj/FakeLinear_output_0", "/blocks.12/self_attn/Shape_output_0", "Shape1867", "Rank1869", "BinaryOp1871", "Unsqueeze1872", "BinaryOp1874", "Unsqueeze1875", "StridedSlice1878", "Squeeze1879", "BinaryOp1881", "/blocks.12/self_attn/Gather_output_0", "/blocks.12/self_attn/Unsqueeze_output_0", "Unsqueeze1889", "Unsqueeze1892", "StridedSlice1895", "Squeeze1896", "BinaryOp1897", "BinaryOp1898", "/blocks.12/self_attn/Gather_1_output_0", "/blocks.12/self_attn/Unsqueeze_1_output_0", "/blocks.12/self_attn/Concat_output_0", "/blocks.12/self_attn/Reshape_output_0", "/blocks.12/self_attn/q_norm/Cast_output_0", "/blocks.12/self_attn/q_norm/Mul_1_output_0", "/blocks.12/self_attn/Mul_output_0", "/blocks.12/self_attn/Shape_2_output_0", "Shape1913", "Rank1915", "BinaryOp1917", "Unsqueeze1918", "BinaryOp1920", "Unsqueeze1921", "StridedSlice1924", "Squeeze1925", "BinaryOp1926", "BinaryOp1927", "/blocks.12/self_attn/Gather_2_output_0", "/blocks.12/self_attn/Div_output_0", "/blocks.12/self_attn/Unsqueeze_7_output_0", "/blocks.12/self_attn/Slice_1_output_0", "/blocks.12/self_attn/Neg_output_0", "/blocks.12/self_attn/Unsqueeze_6_output_0", "/blocks.12/self_attn/Slice_output_0", "/blocks.12/self_attn/Concat_3_output_0", "/blocks.12/self_attn/Mul_1_output_0", "/blocks.12/self_attn/Add_output_0", "/blocks.12/self_attn/k_proj/FakeLinear_output_0", "/blocks.12/self_attn/Unsqueeze_2_output_0", "/blocks.12/self_attn/Unsqueeze_3_output_0", "/blocks.12/self_attn/Concat_1_output_0", "/blocks.12/self_attn/Reshape_1_output_0", "/blocks.12/self_attn/k_norm/Cast_output_0", "/blocks.12/self_attn/k_norm/Mul_1_output_0", "/blocks.12/self_attn/Mul_2_output_0", "/blocks.12/self_attn/Shape_3_output_0", "Shape1955", "Rank1957", "BinaryOp1959", "Unsqueeze1960", "BinaryOp1962", "Unsqueeze1963", "StridedSlice1966", "Squeeze1967", "BinaryOp1968", "BinaryOp1969", "/blocks.12/self_attn/Gather_3_output_0", "/blocks.12/self_attn/Div_1_output_0", "/blocks.12/self_attn/Unsqueeze_9_output_0", "/blocks.12/self_attn/Slice_3_output_0", "/blocks.12/self_attn/Neg_1_output_0", "/blocks.12/self_attn/Unsqueeze_8_output_0", "/blocks.12/self_attn/Slice_2_output_0", "/blocks.12/self_attn/Concat_4_output_0", "/blocks.12/self_attn/Mul_3_output_0", "/blocks.12/self_attn/Add_1_output_0", "/blocks.12/self_attn/v_proj/FakeLinear_output_0", "/blocks.12/self_attn/Unsqueeze_4_output_0", "/blocks.12/self_attn/Unsqueeze_5_output_0", "/blocks.12/self_attn/Concat_2_output_0", "/blocks.12/self_attn/Reshape_2_output_0", "/blocks.12/self_attn/fused_attn/FusedAttention_output_0", "/blocks.12/self_attn/o_proj/FakeLinear_output_0", "/blocks.12/Add_output_0", "/blocks.12/post_attention_layernorm/Mul_1_output_0", "/blocks.12/mlp/gate_proj/FakeLinear_output_0", "/blocks.12/mlp/act_fn/Mul_output_0", "/blocks.12/mlp/up_proj/FakeLinear_output_0", "/blocks.12/mlp/Mul_output_0", "/blocks.12/mlp/down_proj/FakeLinear_output_0", "/blocks.12/Add_1_output_0", "/blocks.13/Reshape_output_0", "/blocks.13/input_layernorm/Mul_1_output_0", "/blocks.13/self_attn/q_proj/FakeLinear_output_0", "/blocks.13/self_attn/Shape_output_0", "Shape2016", "Rank2018", "BinaryOp2020", "Unsqueeze2021", "BinaryOp2023", "Unsqueeze2024", "StridedSlice2027", "Squeeze2028", "BinaryOp2030", "/blocks.13/self_attn/Gather_output_0", "/blocks.13/self_attn/Unsqueeze_output_0", "Unsqueeze2038", "Unsqueeze2041", "StridedSlice2044", "Squeeze2045", "BinaryOp2046", "BinaryOp2047", "/blocks.13/self_attn/Gather_1_output_0", "/blocks.13/self_attn/Unsqueeze_1_output_0", "/blocks.13/self_attn/Concat_output_0", "/blocks.13/self_attn/Reshape_output_0", "/blocks.13/self_attn/q_norm/Cast_output_0", "/blocks.13/self_attn/q_norm/Mul_1_output_0", "/blocks.13/self_attn/Mul_output_0", "/blocks.13/self_attn/Shape_2_output_0", "Shape2062", "Rank2064", "BinaryOp2066", "Unsqueeze2067", "BinaryOp2069", "Unsqueeze2070", "StridedSlice2073", "Squeeze2074", "BinaryOp2075", "BinaryOp2076", "/blocks.13/self_attn/Gather_2_output_0", "/blocks.13/self_attn/Div_output_0", "/blocks.13/self_attn/Unsqueeze_7_output_0", "/blocks.13/self_attn/Slice_1_output_0", "/blocks.13/self_attn/Neg_output_0", "/blocks.13/self_attn/Unsqueeze_6_output_0", "/blocks.13/self_attn/Slice_output_0", "/blocks.13/self_attn/Concat_3_output_0", "/blocks.13/self_attn/Mul_1_output_0", "/blocks.13/self_attn/Add_output_0", "/blocks.13/self_attn/k_proj/FakeLinear_output_0", "/blocks.13/self_attn/Unsqueeze_2_output_0", "/blocks.13/self_attn/Unsqueeze_3_output_0", "/blocks.13/self_attn/Concat_1_output_0", "/blocks.13/self_attn/Reshape_1_output_0", "/blocks.13/self_attn/k_norm/Cast_output_0", "/blocks.13/self_attn/k_norm/Mul_1_output_0", "/blocks.13/self_attn/Mul_2_output_0", "/blocks.13/self_attn/Shape_3_output_0", "Shape2104", "Rank2106", "BinaryOp2108", "Unsqueeze2109", "BinaryOp2111", "Unsqueeze2112", "StridedSlice2115", "Squeeze2116", "BinaryOp2117", "BinaryOp2118", "/blocks.13/self_attn/Gather_3_output_0", "/blocks.13/self_attn/Div_1_output_0", "/blocks.13/self_attn/Unsqueeze_9_output_0", "/blocks.13/self_attn/Slice_3_output_0", "/blocks.13/self_attn/Neg_1_output_0", "/blocks.13/self_attn/Unsqueeze_8_output_0", "/blocks.13/self_attn/Slice_2_output_0", "/blocks.13/self_attn/Concat_4_output_0", "/blocks.13/self_attn/Mul_3_output_0", "/blocks.13/self_attn/Add_1_output_0", "/blocks.13/self_attn/v_proj/FakeLinear_output_0", "/blocks.13/self_attn/Unsqueeze_4_output_0", "/blocks.13/self_attn/Unsqueeze_5_output_0", "/blocks.13/self_attn/Concat_2_output_0", "/blocks.13/self_attn/Reshape_2_output_0", "/blocks.13/self_attn/fused_attn/FusedAttention_output_0", "/blocks.13/self_attn/o_proj/FakeLinear_output_0", "/blocks.13/Add_output_0", "/blocks.13/post_attention_layernorm/Mul_1_output_0", "/blocks.13/mlp/gate_proj/FakeLinear_output_0", "/blocks.13/mlp/act_fn/Mul_output_0", "/blocks.13/mlp/up_proj/FakeLinear_output_0", "/blocks.13/mlp/Mul_output_0", "/blocks.13/mlp/down_proj/FakeLinear_output_0", "/blocks.13/Add_1_output_0", "/blocks.14/Reshape_output_0", "/blocks.14/input_layernorm/Mul_1_output_0", "/blocks.14/self_attn/q_proj/FakeLinear_output_0", "/blocks.14/self_attn/Shape_output_0", "Shape2165", "Rank2167", "BinaryOp2169", "Unsqueeze2170", "BinaryOp2172", "Unsqueeze2173", "StridedSlice2176", "Squeeze2177", "BinaryOp2179", "/blocks.14/self_attn/Gather_output_0", "/blocks.14/self_attn/Unsqueeze_output_0", "Unsqueeze2187", "Unsqueeze2190", "StridedSlice2193", "Squeeze2194", "BinaryOp2195", "BinaryOp2196", "/blocks.14/self_attn/Gather_1_output_0", "/blocks.14/self_attn/Unsqueeze_1_output_0", "/blocks.14/self_attn/Concat_output_0", "/blocks.14/self_attn/Reshape_output_0", "/blocks.14/self_attn/q_norm/Cast_output_0", "/blocks.14/self_attn/q_norm/Mul_1_output_0", "/blocks.14/self_attn/Mul_output_0", "/blocks.14/self_attn/Shape_2_output_0", "Shape2211", "Rank2213", "BinaryOp2215", "Unsqueeze2216", "BinaryOp2218", "Unsqueeze2219", "StridedSlice2222", "Squeeze2223", "BinaryOp2224", "BinaryOp2225", "/blocks.14/self_attn/Gather_2_output_0", "/blocks.14/self_attn/Div_output_0", "/blocks.14/self_attn/Unsqueeze_7_output_0", "/blocks.14/self_attn/Slice_1_output_0", "/blocks.14/self_attn/Neg_output_0", "/blocks.14/self_attn/Unsqueeze_6_output_0", "/blocks.14/self_attn/Slice_output_0", "/blocks.14/self_attn/Concat_3_output_0", "/blocks.14/self_attn/Mul_1_output_0", "/blocks.14/self_attn/Add_output_0", "/blocks.14/self_attn/k_proj/FakeLinear_output_0", "/blocks.14/self_attn/Unsqueeze_2_output_0", "/blocks.14/self_attn/Unsqueeze_3_output_0", "/blocks.14/self_attn/Concat_1_output_0", "/blocks.14/self_attn/Reshape_1_output_0", "/blocks.14/self_attn/k_norm/Cast_output_0", "/blocks.14/self_attn/k_norm/Mul_1_output_0", "/blocks.14/self_attn/Mul_2_output_0", "/blocks.14/self_attn/Shape_3_output_0", "Shape2253", "Rank2255", "BinaryOp2257", "Unsqueeze2258", "BinaryOp2260", "Unsqueeze2261", "StridedSlice2264", "Squeeze2265", "BinaryOp2266", "BinaryOp2267", "/blocks.14/self_attn/Gather_3_output_0", "/blocks.14/self_attn/Div_1_output_0", "/blocks.14/self_attn/Unsqueeze_9_output_0", "/blocks.14/self_attn/Slice_3_output_0", "/blocks.14/self_attn/Neg_1_output_0", "/blocks.14/self_attn/Unsqueeze_8_output_0", "/blocks.14/self_attn/Slice_2_output_0", "/blocks.14/self_attn/Concat_4_output_0", "/blocks.14/self_attn/Mul_3_output_0", "/blocks.14/self_attn/Add_1_output_0", "/blocks.14/self_attn/v_proj/FakeLinear_output_0", "/blocks.14/self_attn/Unsqueeze_4_output_0", "/blocks.14/self_attn/Unsqueeze_5_output_0", "/blocks.14/self_attn/Concat_2_output_0", "/blocks.14/self_attn/Reshape_2_output_0", "/blocks.14/self_attn/fused_attn/FusedAttention_output_0", "/blocks.14/self_attn/o_proj/FakeLinear_output_0", "/blocks.14/Add_output_0", "/blocks.14/post_attention_layernorm/Mul_1_output_0", "/blocks.14/mlp/gate_proj/FakeLinear_output_0", "/blocks.14/mlp/act_fn/Mul_output_0", "/blocks.14/mlp/up_proj/FakeLinear_output_0", "/blocks.14/mlp/Mul_output_0", "/blocks.14/mlp/down_proj/FakeLinear_output_0", "/blocks.14/Add_1_output_0", "/blocks.15/Reshape_output_0", "/blocks.15/input_layernorm/Mul_1_output_0", "/blocks.15/self_attn/q_proj/FakeLinear_output_0", "/blocks.15/self_attn/Shape_output_0", "Shape2314", "Rank2316", "BinaryOp2318", "Unsqueeze2319", "BinaryOp2321", "Unsqueeze2322", "StridedSlice2325", "Squeeze2326", "BinaryOp2328", "/blocks.15/self_attn/Gather_output_0", "/blocks.15/self_attn/Unsqueeze_output_0", "Unsqueeze2336", "Unsqueeze2339", "StridedSlice2342", "Squeeze2343", "BinaryOp2344", "BinaryOp2345", "/blocks.15/self_attn/Gather_1_output_0", "/blocks.15/self_attn/Unsqueeze_1_output_0", "/blocks.15/self_attn/Concat_output_0", "/blocks.15/self_attn/Reshape_output_0", "/blocks.15/self_attn/q_norm/Cast_output_0", "/blocks.15/self_attn/q_norm/Mul_1_output_0", "/blocks.15/self_attn/Mul_output_0", "/blocks.15/self_attn/Shape_2_output_0", "Shape2360", "Rank2362", "BinaryOp2364", "Unsqueeze2365", "BinaryOp2367", "Unsqueeze2368", "StridedSlice2371", "Squeeze2372", "BinaryOp2373", "BinaryOp2374", "/blocks.15/self_attn/Gather_2_output_0", "/blocks.15/self_attn/Div_output_0", "/blocks.15/self_attn/Unsqueeze_7_output_0", "/blocks.15/self_attn/Slice_1_output_0", "/blocks.15/self_attn/Neg_output_0", "/blocks.15/self_attn/Unsqueeze_6_output_0", "/blocks.15/self_attn/Slice_output_0", "/blocks.15/self_attn/Concat_3_output_0", "/blocks.15/self_attn/Mul_1_output_0", "/blocks.15/self_attn/Add_output_0", "/blocks.15/self_attn/k_proj/FakeLinear_output_0", "/blocks.15/self_attn/Unsqueeze_2_output_0", "/blocks.15/self_attn/Unsqueeze_3_output_0", "/blocks.15/self_attn/Concat_1_output_0", "/blocks.15/self_attn/Reshape_1_output_0", "/blocks.15/self_attn/k_norm/Cast_output_0", "/blocks.15/self_attn/k_norm/Mul_1_output_0", "/blocks.15/self_attn/Mul_2_output_0", "/blocks.15/self_attn/Shape_3_output_0", "Shape2402", "Rank2404", "BinaryOp2406", "Unsqueeze2407", "BinaryOp2409", "Unsqueeze2410", "StridedSlice2413", "Squeeze2414", "BinaryOp2415", "BinaryOp2416", "/blocks.15/self_attn/Gather_3_output_0", "/blocks.15/self_attn/Div_1_output_0", "/blocks.15/self_attn/Unsqueeze_9_output_0", "/blocks.15/self_attn/Slice_3_output_0", "/blocks.15/self_attn/Neg_1_output_0", "/blocks.15/self_attn/Unsqueeze_8_output_0", "/blocks.15/self_attn/Slice_2_output_0", "/blocks.15/self_attn/Concat_4_output_0", "/blocks.15/self_attn/Mul_3_output_0", "/blocks.15/self_attn/Add_1_output_0", "/blocks.15/self_attn/v_proj/FakeLinear_output_0", "/blocks.15/self_attn/Unsqueeze_4_output_0", "/blocks.15/self_attn/Unsqueeze_5_output_0", "/blocks.15/self_attn/Concat_2_output_0", "/blocks.15/self_attn/Reshape_2_output_0", "/blocks.15/self_attn/fused_attn/FusedAttention_output_0", "/blocks.15/self_attn/o_proj/FakeLinear_output_0", "/blocks.15/Add_output_0", "/blocks.15/post_attention_layernorm/Mul_1_output_0", "/blocks.15/mlp/gate_proj/FakeLinear_output_0", "/blocks.15/mlp/act_fn/Mul_output_0", "/blocks.15/mlp/up_proj/FakeLinear_output_0", "/blocks.15/mlp/Mul_output_0", "/blocks.15/mlp/down_proj/FakeLinear_output_0", "/blocks.15/Add_1_output_0", "/blocks.16/Reshape_output_0", "/blocks.16/input_layernorm/Mul_1_output_0", "/blocks.16/self_attn/q_proj/FakeLinear_output_0", "/blocks.16/self_attn/Shape_output_0", "Shape2463", "Rank2465", "BinaryOp2467", "Unsqueeze2468", "BinaryOp2470", "Unsqueeze2471", "StridedSlice2474", "Squeeze2475", "BinaryOp2477", "/blocks.16/self_attn/Gather_output_0", "/blocks.16/self_attn/Unsqueeze_output_0", "Unsqueeze2485", "Unsqueeze2488", "StridedSlice2491", "Squeeze2492", "BinaryOp2493", "BinaryOp2494", "/blocks.16/self_attn/Gather_1_output_0", "/blocks.16/self_attn/Unsqueeze_1_output_0", "/blocks.16/self_attn/Concat_output_0", "/blocks.16/self_attn/Reshape_output_0", "/blocks.16/self_attn/q_norm/Cast_output_0", "/blocks.16/self_attn/q_norm/Mul_1_output_0", "/blocks.16/self_attn/Mul_output_0", "/blocks.16/self_attn/Shape_2_output_0", "Shape2509", "Rank2511", "BinaryOp2513", "Unsqueeze2514", "BinaryOp2516", "Unsqueeze2517", "StridedSlice2520", "Squeeze2521", "BinaryOp2522", "BinaryOp2523", "/blocks.16/self_attn/Gather_2_output_0", "/blocks.16/self_attn/Div_output_0", "/blocks.16/self_attn/Unsqueeze_7_output_0", "/blocks.16/self_attn/Slice_1_output_0", "/blocks.16/self_attn/Neg_output_0", "/blocks.16/self_attn/Unsqueeze_6_output_0", "/blocks.16/self_attn/Slice_output_0", "/blocks.16/self_attn/Concat_3_output_0", "/blocks.16/self_attn/Mul_1_output_0", "/blocks.16/self_attn/Add_output_0", "/blocks.16/self_attn/k_proj/FakeLinear_output_0", "/blocks.16/self_attn/Unsqueeze_2_output_0", "/blocks.16/self_attn/Unsqueeze_3_output_0", "/blocks.16/self_attn/Concat_1_output_0", "/blocks.16/self_attn/Reshape_1_output_0", "/blocks.16/self_attn/k_norm/Cast_output_0", "/blocks.16/self_attn/k_norm/Mul_1_output_0", "/blocks.16/self_attn/Mul_2_output_0", "/blocks.16/self_attn/Shape_3_output_0", "Shape2551", "Rank2553", "BinaryOp2555", "Unsqueeze2556", "BinaryOp2558", "Unsqueeze2559", "StridedSlice2562", "Squeeze2563", "BinaryOp2564", "BinaryOp2565", "/blocks.16/self_attn/Gather_3_output_0", "/blocks.16/self_attn/Div_1_output_0", "/blocks.16/self_attn/Unsqueeze_9_output_0", "/blocks.16/self_attn/Slice_3_output_0", "/blocks.16/self_attn/Neg_1_output_0", "/blocks.16/self_attn/Unsqueeze_8_output_0", "/blocks.16/self_attn/Slice_2_output_0", "/blocks.16/self_attn/Concat_4_output_0", "/blocks.16/self_attn/Mul_3_output_0", "/blocks.16/self_attn/Add_1_output_0", "/blocks.16/self_attn/v_proj/FakeLinear_output_0", "/blocks.16/self_attn/Unsqueeze_4_output_0", "/blocks.16/self_attn/Unsqueeze_5_output_0", "/blocks.16/self_attn/Concat_2_output_0", "/blocks.16/self_attn/Reshape_2_output_0", "/blocks.16/self_attn/fused_attn/FusedAttention_output_0", "/blocks.16/self_attn/o_proj/FakeLinear_output_0", "/blocks.16/Add_output_0", "/blocks.16/post_attention_layernorm/Mul_1_output_0", "/blocks.16/mlp/gate_proj/FakeLinear_output_0", "/blocks.16/mlp/act_fn/Mul_output_0", "/blocks.16/mlp/up_proj/FakeLinear_output_0", "/blocks.16/mlp/Mul_output_0", "/blocks.16/mlp/down_proj/FakeLinear_output_0", "/blocks.16/Add_1_output_0", "/blocks.17/Reshape_output_0", "/blocks.17/input_layernorm/Mul_1_output_0", "/blocks.17/self_attn/q_proj/FakeLinear_output_0", "/blocks.17/self_attn/Shape_output_0", "Shape2612", "Rank2614", "BinaryOp2616", "Unsqueeze2617", "BinaryOp2619", "Unsqueeze2620", "StridedSlice2623", "Squeeze2624", "BinaryOp2626", "/blocks.17/self_attn/Gather_output_0", "/blocks.17/self_attn/Unsqueeze_output_0", "Unsqueeze2634", "Unsqueeze2637", "StridedSlice2640", "Squeeze2641", "BinaryOp2642", "BinaryOp2643", "/blocks.17/self_attn/Gather_1_output_0", "/blocks.17/self_attn/Unsqueeze_1_output_0", "/blocks.17/self_attn/Concat_output_0", "/blocks.17/self_attn/Reshape_output_0", "/blocks.17/self_attn/q_norm/Cast_output_0", "/blocks.17/self_attn/q_norm/Mul_1_output_0", "/blocks.17/self_attn/Mul_output_0", "/blocks.17/self_attn/Shape_2_output_0", "Shape2658", "Rank2660", "BinaryOp2662", "Unsqueeze2663", "BinaryOp2665", "Unsqueeze2666", "StridedSlice2669", "Squeeze2670", "BinaryOp2671", "BinaryOp2672", "/blocks.17/self_attn/Gather_2_output_0", "/blocks.17/self_attn/Div_output_0", "/blocks.17/self_attn/Unsqueeze_7_output_0", "/blocks.17/self_attn/Slice_1_output_0", "/blocks.17/self_attn/Neg_output_0", "/blocks.17/self_attn/Unsqueeze_6_output_0", "/blocks.17/self_attn/Slice_output_0", "/blocks.17/self_attn/Concat_3_output_0", "/blocks.17/self_attn/Mul_1_output_0", "/blocks.17/self_attn/Add_output_0", "/blocks.17/self_attn/k_proj/FakeLinear_output_0", "/blocks.17/self_attn/Unsqueeze_2_output_0", "/blocks.17/self_attn/Unsqueeze_3_output_0", "/blocks.17/self_attn/Concat_1_output_0", "/blocks.17/self_attn/Reshape_1_output_0", "/blocks.17/self_attn/k_norm/Cast_output_0", "/blocks.17/self_attn/k_norm/Mul_1_output_0", "/blocks.17/self_attn/Mul_2_output_0", "/blocks.17/self_attn/Shape_3_output_0", "Shape2700", "Rank2702", "BinaryOp2704", "Unsqueeze2705", "BinaryOp2707", "Unsqueeze2708", "StridedSlice2711", "Squeeze2712", "BinaryOp2713", "BinaryOp2714", "/blocks.17/self_attn/Gather_3_output_0", "/blocks.17/self_attn/Div_1_output_0", "/blocks.17/self_attn/Unsqueeze_9_output_0", "/blocks.17/self_attn/Slice_3_output_0", "/blocks.17/self_attn/Neg_1_output_0", "/blocks.17/self_attn/Unsqueeze_8_output_0", "/blocks.17/self_attn/Slice_2_output_0", "/blocks.17/self_attn/Concat_4_output_0", "/blocks.17/self_attn/Mul_3_output_0", "/blocks.17/self_attn/Add_1_output_0", "/blocks.17/self_attn/v_proj/FakeLinear_output_0", "/blocks.17/self_attn/Unsqueeze_4_output_0", "/blocks.17/self_attn/Unsqueeze_5_output_0", "/blocks.17/self_attn/Concat_2_output_0", "/blocks.17/self_attn/Reshape_2_output_0", "/blocks.17/self_attn/fused_attn/FusedAttention_output_0", "/blocks.17/self_attn/o_proj/FakeLinear_output_0", "/blocks.17/Add_output_0", "/blocks.17/post_attention_layernorm/Mul_1_output_0", "/blocks.17/mlp/gate_proj/FakeLinear_output_0", "/blocks.17/mlp/act_fn/Mul_output_0", "/blocks.17/mlp/up_proj/FakeLinear_output_0", "/blocks.17/mlp/Mul_output_0", "/blocks.17/mlp/down_proj/FakeLinear_output_0", "/blocks.17/Add_1_output_0", "/blocks.18/Reshape_output_0", "/blocks.18/input_layernorm/Mul_1_output_0", "/blocks.18/self_attn/q_proj/FakeLinear_output_0", "/blocks.18/self_attn/Shape_output_0", "Shape2761", "Rank2763", "BinaryOp2765", "Unsqueeze2766", "BinaryOp2768", "Unsqueeze2769", "StridedSlice2772", "Squeeze2773", "BinaryOp2775", "/blocks.18/self_attn/Gather_output_0", "/blocks.18/self_attn/Unsqueeze_output_0", "Unsqueeze2783", "Unsqueeze2786", "StridedSlice2789", "Squeeze2790", "BinaryOp2791", "BinaryOp2792", "/blocks.18/self_attn/Gather_1_output_0", "/blocks.18/self_attn/Unsqueeze_1_output_0", "/blocks.18/self_attn/Concat_output_0", "/blocks.18/self_attn/Reshape_output_0", "/blocks.18/self_attn/q_norm/Cast_output_0", "/blocks.18/self_attn/q_norm/Mul_1_output_0", "/blocks.18/self_attn/Mul_output_0", "/blocks.18/self_attn/Shape_2_output_0", "Shape2807", "Rank2809", "BinaryOp2811", "Unsqueeze2812", "BinaryOp2814", "Unsqueeze2815", "StridedSlice2818", "Squeeze2819", "BinaryOp2820", "BinaryOp2821", "/blocks.18/self_attn/Gather_2_output_0", "/blocks.18/self_attn/Div_output_0", "/blocks.18/self_attn/Unsqueeze_7_output_0", "/blocks.18/self_attn/Slice_1_output_0", "/blocks.18/self_attn/Neg_output_0", "/blocks.18/self_attn/Unsqueeze_6_output_0", "/blocks.18/self_attn/Slice_output_0", "/blocks.18/self_attn/Concat_3_output_0", "/blocks.18/self_attn/Mul_1_output_0", "/blocks.18/self_attn/Add_output_0", "/blocks.18/self_attn/k_proj/FakeLinear_output_0", "/blocks.18/self_attn/Unsqueeze_2_output_0", "/blocks.18/self_attn/Unsqueeze_3_output_0", "/blocks.18/self_attn/Concat_1_output_0", "/blocks.18/self_attn/Reshape_1_output_0", "/blocks.18/self_attn/k_norm/Cast_output_0", "/blocks.18/self_attn/k_norm/Mul_1_output_0", "/blocks.18/self_attn/Mul_2_output_0", "/blocks.18/self_attn/Shape_3_output_0", "Shape2849", "Rank2851", "BinaryOp2853", "Unsqueeze2854", "BinaryOp2856", "Unsqueeze2857", "StridedSlice2860", "Squeeze2861", "BinaryOp2862", "BinaryOp2863", "/blocks.18/self_attn/Gather_3_output_0", "/blocks.18/self_attn/Div_1_output_0", "/blocks.18/self_attn/Unsqueeze_9_output_0", "/blocks.18/self_attn/Slice_3_output_0", "/blocks.18/self_attn/Neg_1_output_0", "/blocks.18/self_attn/Unsqueeze_8_output_0", "/blocks.18/self_attn/Slice_2_output_0", "/blocks.18/self_attn/Concat_4_output_0", "/blocks.18/self_attn/Mul_3_output_0", "/blocks.18/self_attn/Add_1_output_0", "/blocks.18/self_attn/v_proj/FakeLinear_output_0", "/blocks.18/self_attn/Unsqueeze_4_output_0", "/blocks.18/self_attn/Unsqueeze_5_output_0", "/blocks.18/self_attn/Concat_2_output_0", "/blocks.18/self_attn/Reshape_2_output_0", "/blocks.18/self_attn/fused_attn/FusedAttention_output_0", "/blocks.18/self_attn/o_proj/FakeLinear_output_0", "/blocks.18/Add_output_0", "/blocks.18/post_attention_layernorm/Mul_1_output_0", "/blocks.18/mlp/gate_proj/FakeLinear_output_0", "/blocks.18/mlp/act_fn/Mul_output_0", "/blocks.18/mlp/up_proj/FakeLinear_output_0", "/blocks.18/mlp/Mul_output_0", "/blocks.18/mlp/down_proj/FakeLinear_output_0", "/blocks.18/Add_1_output_0", "/blocks.19/Reshape_output_0", "/blocks.19/input_layernorm/Mul_1_output_0", "/blocks.19/self_attn/q_proj/FakeLinear_output_0", "/blocks.19/self_attn/Shape_output_0", "Shape2910", "Rank2912", "BinaryOp2914", "Unsqueeze2915", "BinaryOp2917", "Unsqueeze2918", "StridedSlice2921", "Squeeze2922", "BinaryOp2924", "/blocks.19/self_attn/Gather_output_0", "/blocks.19/self_attn/Unsqueeze_output_0", "Unsqueeze2932", "Unsqueeze2935", "StridedSlice2938", "Squeeze2939", "BinaryOp2940", "BinaryOp2941", "/blocks.19/self_attn/Gather_1_output_0", "/blocks.19/self_attn/Unsqueeze_1_output_0", "/blocks.19/self_attn/Concat_output_0", "/blocks.19/self_attn/Reshape_output_0", "/blocks.19/self_attn/q_norm/Cast_output_0", "/blocks.19/self_attn/q_norm/Mul_1_output_0", "/blocks.19/self_attn/Mul_output_0", "/blocks.19/self_attn/Shape_2_output_0", "Shape2956", "Rank2958", "BinaryOp2960", "Unsqueeze2961", "BinaryOp2963", "Unsqueeze2964", "StridedSlice2967", "Squeeze2968", "BinaryOp2969", "BinaryOp2970", "/blocks.19/self_attn/Gather_2_output_0", "/blocks.19/self_attn/Div_output_0", "/blocks.19/self_attn/Unsqueeze_7_output_0", "/blocks.19/self_attn/Slice_1_output_0", "/blocks.19/self_attn/Neg_output_0", "/blocks.19/self_attn/Unsqueeze_6_output_0", "/blocks.19/self_attn/Slice_output_0", "/blocks.19/self_attn/Concat_3_output_0", "/blocks.19/self_attn/Mul_1_output_0", "/blocks.19/self_attn/Add_output_0", "/blocks.19/self_attn/k_proj/FakeLinear_output_0", "/blocks.19/self_attn/Unsqueeze_2_output_0", "/blocks.19/self_attn/Unsqueeze_3_output_0", "/blocks.19/self_attn/Concat_1_output_0", "/blocks.19/self_attn/Reshape_1_output_0", "/blocks.19/self_attn/k_norm/Cast_output_0", "/blocks.19/self_attn/k_norm/Mul_1_output_0", "/blocks.19/self_attn/Mul_2_output_0", "/blocks.19/self_attn/Shape_3_output_0", "Shape2998", "Rank3000", "BinaryOp3002", "Unsqueeze3003", "BinaryOp3005", "Unsqueeze3006", "StridedSlice3009", "Squeeze3010", "BinaryOp3011", "BinaryOp3012", "/blocks.19/self_attn/Gather_3_output_0", "/blocks.19/self_attn/Div_1_output_0", "/blocks.19/self_attn/Unsqueeze_9_output_0", "/blocks.19/self_attn/Slice_3_output_0", "/blocks.19/self_attn/Neg_1_output_0", "/blocks.19/self_attn/Unsqueeze_8_output_0", "/blocks.19/self_attn/Slice_2_output_0", "/blocks.19/self_attn/Concat_4_output_0", "/blocks.19/self_attn/Mul_3_output_0", "/blocks.19/self_attn/Add_1_output_0", "/blocks.19/self_attn/v_proj/FakeLinear_output_0", "/blocks.19/self_attn/Unsqueeze_4_output_0", "/blocks.19/self_attn/Unsqueeze_5_output_0", "/blocks.19/self_attn/Concat_2_output_0", "/blocks.19/self_attn/Reshape_2_output_0", "/blocks.19/self_attn/fused_attn/FusedAttention_output_0", "/blocks.19/self_attn/o_proj/FakeLinear_output_0", "/blocks.19/Add_output_0", "/blocks.19/post_attention_layernorm/Mul_1_output_0", "/blocks.19/mlp/gate_proj/FakeLinear_output_0", "/blocks.19/mlp/act_fn/Mul_output_0", "/blocks.19/mlp/up_proj/FakeLinear_output_0", "/blocks.19/mlp/Mul_output_0", "/blocks.19/mlp/down_proj/FakeLinear_output_0", "/blocks.19/Add_1_output_0", "/blocks.20/Reshape_output_0", "/blocks.20/input_layernorm/Mul_1_output_0", "/blocks.20/self_attn/q_proj/FakeLinear_output_0", "/blocks.20/self_attn/Shape_output_0", "Shape3059", "Rank3061", "BinaryOp3063", "Unsqueeze3064", "BinaryOp3066", "Unsqueeze3067", "StridedSlice3070", "Squeeze3071", "BinaryOp3073", "/blocks.20/self_attn/Gather_output_0", "/blocks.20/self_attn/Unsqueeze_output_0", "Unsqueeze3081", "Unsqueeze3084", "StridedSlice3087", "Squeeze3088", "BinaryOp3089", "BinaryOp3090", "/blocks.20/self_attn/Gather_1_output_0", "/blocks.20/self_attn/Unsqueeze_1_output_0", "/blocks.20/self_attn/Concat_output_0", "/blocks.20/self_attn/Reshape_output_0", "/blocks.20/self_attn/q_norm/Cast_output_0", "/blocks.20/self_attn/q_norm/Mul_1_output_0", "/blocks.20/self_attn/Mul_output_0", "/blocks.20/self_attn/Shape_2_output_0", "Shape3105", "Rank3107", "BinaryOp3109", "Unsqueeze3110", "BinaryOp3112", "Unsqueeze3113", "StridedSlice3116", "Squeeze3117", "BinaryOp3118", "BinaryOp3119", "/blocks.20/self_attn/Gather_2_output_0", "/blocks.20/self_attn/Div_output_0", "/blocks.20/self_attn/Unsqueeze_7_output_0", "/blocks.20/self_attn/Slice_1_output_0", "/blocks.20/self_attn/Neg_output_0", "/blocks.20/self_attn/Unsqueeze_6_output_0", "/blocks.20/self_attn/Slice_output_0", "/blocks.20/self_attn/Concat_3_output_0", "/blocks.20/self_attn/Mul_1_output_0", "/blocks.20/self_attn/Add_output_0", "/blocks.20/self_attn/k_proj/FakeLinear_output_0", "/blocks.20/self_attn/Unsqueeze_2_output_0", "/blocks.20/self_attn/Unsqueeze_3_output_0", "/blocks.20/self_attn/Concat_1_output_0", "/blocks.20/self_attn/Reshape_1_output_0", "/blocks.20/self_attn/k_norm/Cast_output_0", "/blocks.20/self_attn/k_norm/Mul_1_output_0", "/blocks.20/self_attn/Mul_2_output_0", "/blocks.20/self_attn/Shape_3_output_0", "Shape3147", "Rank3149", "BinaryOp3151", "Unsqueeze3152", "BinaryOp3154", "Unsqueeze3155", "StridedSlice3158", "Squeeze3159", "BinaryOp3160", "BinaryOp3161", "/blocks.20/self_attn/Gather_3_output_0", "/blocks.20/self_attn/Div_1_output_0", "/blocks.20/self_attn/Unsqueeze_9_output_0", "/blocks.20/self_attn/Slice_3_output_0", "/blocks.20/self_attn/Neg_1_output_0", "/blocks.20/self_attn/Unsqueeze_8_output_0", "/blocks.20/self_attn/Slice_2_output_0", "/blocks.20/self_attn/Concat_4_output_0", "/blocks.20/self_attn/Mul_3_output_0", "/blocks.20/self_attn/Add_1_output_0", "/blocks.20/self_attn/v_proj/FakeLinear_output_0", "/blocks.20/self_attn/Unsqueeze_4_output_0", "/blocks.20/self_attn/Unsqueeze_5_output_0", "/blocks.20/self_attn/Concat_2_output_0", "/blocks.20/self_attn/Reshape_2_output_0", "/blocks.20/self_attn/fused_attn/FusedAttention_output_0", "/blocks.20/self_attn/o_proj/FakeLinear_output_0", "/blocks.20/Add_output_0", "/blocks.20/post_attention_layernorm/Mul_1_output_0", "/blocks.20/mlp/gate_proj/FakeLinear_output_0", "/blocks.20/mlp/act_fn/Mul_output_0", "/blocks.20/mlp/up_proj/FakeLinear_output_0", "/blocks.20/mlp/Mul_output_0", "/blocks.20/mlp/down_proj/FakeLinear_output_0", "/blocks.20/Add_1_output_0", "/blocks.21/Reshape_output_0", "/blocks.21/input_layernorm/Mul_1_output_0", "/blocks.21/self_attn/q_proj/FakeLinear_output_0", "/blocks.21/self_attn/Shape_output_0", "Shape3208", "Rank3210", "BinaryOp3212", "Unsqueeze3213", "BinaryOp3215", "Unsqueeze3216", "StridedSlice3219", "Squeeze3220", "BinaryOp3222", "/blocks.21/self_attn/Gather_output_0", "/blocks.21/self_attn/Unsqueeze_output_0", "Unsqueeze3230", "Unsqueeze3233", "StridedSlice3236", "Squeeze3237", "BinaryOp3238", "BinaryOp3239", "/blocks.21/self_attn/Gather_1_output_0", "/blocks.21/self_attn/Unsqueeze_1_output_0", "/blocks.21/self_attn/Concat_output_0", "/blocks.21/self_attn/Reshape_output_0", "/blocks.21/self_attn/q_norm/Cast_output_0", "/blocks.21/self_attn/q_norm/Mul_1_output_0", "/blocks.21/self_attn/Mul_output_0", "/blocks.21/self_attn/Shape_2_output_0", "Shape3254", "Rank3256", "BinaryOp3258", "Unsqueeze3259", "BinaryOp3261", "Unsqueeze3262", "StridedSlice3265", "Squeeze3266", "BinaryOp3267", "BinaryOp3268", "/blocks.21/self_attn/Gather_2_output_0", "/blocks.21/self_attn/Div_output_0", "/blocks.21/self_attn/Unsqueeze_7_output_0", "/blocks.21/self_attn/Slice_1_output_0", "/blocks.21/self_attn/Neg_output_0", "/blocks.21/self_attn/Unsqueeze_6_output_0", "/blocks.21/self_attn/Slice_output_0", "/blocks.21/self_attn/Concat_3_output_0", "/blocks.21/self_attn/Mul_1_output_0", "/blocks.21/self_attn/Add_output_0", "/blocks.21/self_attn/k_proj/FakeLinear_output_0", "/blocks.21/self_attn/Unsqueeze_2_output_0", "/blocks.21/self_attn/Unsqueeze_3_output_0", "/blocks.21/self_attn/Concat_1_output_0", "/blocks.21/self_attn/Reshape_1_output_0", "/blocks.21/self_attn/k_norm/Cast_output_0", "/blocks.21/self_attn/k_norm/Mul_1_output_0", "/blocks.21/self_attn/Mul_2_output_0", "/blocks.21/self_attn/Shape_3_output_0", "Shape3296", "Rank3298", "BinaryOp3300", "Unsqueeze3301", "BinaryOp3303", "Unsqueeze3304", "StridedSlice3307", "Squeeze3308", "BinaryOp3309", "BinaryOp3310", "/blocks.21/self_attn/Gather_3_output_0", "/blocks.21/self_attn/Div_1_output_0", "/blocks.21/self_attn/Unsqueeze_9_output_0", "/blocks.21/self_attn/Slice_3_output_0", "/blocks.21/self_attn/Neg_1_output_0", "/blocks.21/self_attn/Unsqueeze_8_output_0", "/blocks.21/self_attn/Slice_2_output_0", "/blocks.21/self_attn/Concat_4_output_0", "/blocks.21/self_attn/Mul_3_output_0", "/blocks.21/self_attn/Add_1_output_0", "/blocks.21/self_attn/v_proj/FakeLinear_output_0", "/blocks.21/self_attn/Unsqueeze_4_output_0", "/blocks.21/self_attn/Unsqueeze_5_output_0", "/blocks.21/self_attn/Concat_2_output_0", "/blocks.21/self_attn/Reshape_2_output_0", "/blocks.21/self_attn/fused_attn/FusedAttention_output_0", "/blocks.21/self_attn/o_proj/FakeLinear_output_0", "/blocks.21/Add_output_0", "/blocks.21/post_attention_layernorm/Mul_1_output_0", "/blocks.21/mlp/gate_proj/FakeLinear_output_0", "/blocks.21/mlp/act_fn/Mul_output_0", "/blocks.21/mlp/up_proj/FakeLinear_output_0", "/blocks.21/mlp/Mul_output_0", "/blocks.21/mlp/down_proj/FakeLinear_output_0", "/blocks.21/Add_1_output_0", "/blocks.22/Reshape_output_0", "/blocks.22/input_layernorm/Mul_1_output_0", "/blocks.22/self_attn/q_proj/FakeLinear_output_0", "/blocks.22/self_attn/Shape_output_0", "Shape3357", "Rank3359", "BinaryOp3361", "Unsqueeze3362", "BinaryOp3364", "Unsqueeze3365", "StridedSlice3368", "Squeeze3369", "BinaryOp3371", "/blocks.22/self_attn/Gather_output_0", "/blocks.22/self_attn/Unsqueeze_output_0", "Unsqueeze3379", "Unsqueeze3382", "StridedSlice3385", "Squeeze3386", "BinaryOp3387", "BinaryOp3388", "/blocks.22/self_attn/Gather_1_output_0", "/blocks.22/self_attn/Unsqueeze_1_output_0", "/blocks.22/self_attn/Concat_output_0", "/blocks.22/self_attn/Reshape_output_0", "/blocks.22/self_attn/q_norm/Cast_output_0", "/blocks.22/self_attn/q_norm/Mul_1_output_0", "/blocks.22/self_attn/Mul_output_0", "/blocks.22/self_attn/Shape_2_output_0", "Shape3403", "Rank3405", "BinaryOp3407", "Unsqueeze3408", "BinaryOp3410", "Unsqueeze3411", "StridedSlice3414", "Squeeze3415", "BinaryOp3416", "BinaryOp3417", "/blocks.22/self_attn/Gather_2_output_0", "/blocks.22/self_attn/Div_output_0", "/blocks.22/self_attn/Unsqueeze_7_output_0", "/blocks.22/self_attn/Slice_1_output_0", "/blocks.22/self_attn/Neg_output_0", "/blocks.22/self_attn/Unsqueeze_6_output_0", "/blocks.22/self_attn/Slice_output_0", "/blocks.22/self_attn/Concat_3_output_0", "/blocks.22/self_attn/Mul_1_output_0", "/blocks.22/self_attn/Add_output_0", "/blocks.22/self_attn/k_proj/FakeLinear_output_0", "/blocks.22/self_attn/Unsqueeze_2_output_0", "/blocks.22/self_attn/Unsqueeze_3_output_0", "/blocks.22/self_attn/Concat_1_output_0", "/blocks.22/self_attn/Reshape_1_output_0", "/blocks.22/self_attn/k_norm/Cast_output_0", "/blocks.22/self_attn/k_norm/Mul_1_output_0", "/blocks.22/self_attn/Mul_2_output_0", "/blocks.22/self_attn/Shape_3_output_0", "Shape3445", "Rank3447", "BinaryOp3449", "Unsqueeze3450", "BinaryOp3452", "Unsqueeze3453", "StridedSlice3456", "Squeeze3457", "BinaryOp3458", "BinaryOp3459", "/blocks.22/self_attn/Gather_3_output_0", "/blocks.22/self_attn/Div_1_output_0", "/blocks.22/self_attn/Unsqueeze_9_output_0", "/blocks.22/self_attn/Slice_3_output_0", "/blocks.22/self_attn/Neg_1_output_0", "/blocks.22/self_attn/Unsqueeze_8_output_0", "/blocks.22/self_attn/Slice_2_output_0", "/blocks.22/self_attn/Concat_4_output_0", "/blocks.22/self_attn/Mul_3_output_0", "/blocks.22/self_attn/Add_1_output_0", "/blocks.22/self_attn/v_proj/FakeLinear_output_0", "/blocks.22/self_attn/Unsqueeze_4_output_0", "/blocks.22/self_attn/Unsqueeze_5_output_0", "/blocks.22/self_attn/Concat_2_output_0", "/blocks.22/self_attn/Reshape_2_output_0", "/blocks.22/self_attn/fused_attn/FusedAttention_output_0", "/blocks.22/self_attn/o_proj/FakeLinear_output_0", "/blocks.22/Add_output_0", "/blocks.22/post_attention_layernorm/Mul_1_output_0", "/blocks.22/mlp/gate_proj/FakeLinear_output_0", "/blocks.22/mlp/act_fn/Mul_output_0", "/blocks.22/mlp/up_proj/FakeLinear_output_0", "/blocks.22/mlp/Mul_output_0", "/blocks.22/mlp/down_proj/FakeLinear_output_0", "/blocks.22/Add_1_output_0", "/blocks.23/Reshape_output_0", "/blocks.23/input_layernorm/Mul_1_output_0", "/blocks.23/self_attn/q_proj/FakeLinear_output_0", "/blocks.23/self_attn/Shape_output_0", "Shape3506", "Rank3508", "BinaryOp3510", "Unsqueeze3511", "BinaryOp3513", "Unsqueeze3514", "StridedSlice3517", "Squeeze3518", "BinaryOp3520", "/blocks.23/self_attn/Gather_output_0", "/blocks.23/self_attn/Unsqueeze_output_0", "Unsqueeze3528", "Unsqueeze3531", "StridedSlice3534", "Squeeze3535", "BinaryOp3536", "BinaryOp3537", "/blocks.23/self_attn/Gather_1_output_0", "/blocks.23/self_attn/Unsqueeze_1_output_0", "/blocks.23/self_attn/Concat_output_0", "/blocks.23/self_attn/Reshape_output_0", "/blocks.23/self_attn/q_norm/Cast_output_0", "/blocks.23/self_attn/q_norm/Mul_1_output_0", "/blocks.23/self_attn/Mul_output_0", "/blocks.23/self_attn/Shape_2_output_0", "Shape3552", "Rank3554", "BinaryOp3556", "Unsqueeze3557", "BinaryOp3559", "Unsqueeze3560", "StridedSlice3563", "Squeeze3564", "BinaryOp3565", "BinaryOp3566", "/blocks.23/self_attn/Gather_2_output_0", "/blocks.23/self_attn/Div_output_0", "/blocks.23/self_attn/Unsqueeze_7_output_0", "/blocks.23/self_attn/Slice_1_output_0", "/blocks.23/self_attn/Neg_output_0", "/blocks.23/self_attn/Unsqueeze_6_output_0", "/blocks.23/self_attn/Slice_output_0", "/blocks.23/self_attn/Concat_3_output_0", "/blocks.23/self_attn/Mul_1_output_0", "/blocks.23/self_attn/Add_output_0", "/blocks.23/self_attn/k_proj/FakeLinear_output_0", "/blocks.23/self_attn/Unsqueeze_2_output_0", "/blocks.23/self_attn/Unsqueeze_3_output_0", "/blocks.23/self_attn/Concat_1_output_0", "/blocks.23/self_attn/Reshape_1_output_0", "/blocks.23/self_attn/k_norm/Cast_output_0", "/blocks.23/self_attn/k_norm/Mul_1_output_0", "/blocks.23/self_attn/Mul_2_output_0", "/blocks.23/self_attn/Shape_3_output_0", "Shape3594", "Rank3596", "BinaryOp3598", "Unsqueeze3599", "BinaryOp3601", "Unsqueeze3602", "StridedSlice3605", "Squeeze3606", "BinaryOp3607", "BinaryOp3608", "/blocks.23/self_attn/Gather_3_output_0", "/blocks.23/self_attn/Div_1_output_0", "/blocks.23/self_attn/Unsqueeze_9_output_0", "/blocks.23/self_attn/Slice_3_output_0", "/blocks.23/self_attn/Neg_1_output_0", "/blocks.23/self_attn/Unsqueeze_8_output_0", "/blocks.23/self_attn/Slice_2_output_0", "/blocks.23/self_attn/Concat_4_output_0", "/blocks.23/self_attn/Mul_3_output_0", "/blocks.23/self_attn/Add_1_output_0", "/blocks.23/self_attn/v_proj/FakeLinear_output_0", "/blocks.23/self_attn/Unsqueeze_4_output_0", "/blocks.23/self_attn/Unsqueeze_5_output_0", "/blocks.23/self_attn/Concat_2_output_0", "/blocks.23/self_attn/Reshape_2_output_0", "/blocks.23/self_attn/fused_attn/FusedAttention_output_0", "/blocks.23/self_attn/o_proj/FakeLinear_output_0", "/blocks.23/Add_output_0", "/blocks.23/post_attention_layernorm/Mul_1_output_0", "/blocks.23/mlp/gate_proj/FakeLinear_output_0", "/blocks.23/mlp/act_fn/Mul_output_0", "/blocks.23/mlp/up_proj/FakeLinear_output_0", "/blocks.23/mlp/Mul_output_0", "/blocks.23/mlp/down_proj/FakeLinear_output_0", "/blocks.23/Add_1_output_0", "/blocks.24/Reshape_output_0", "/blocks.24/input_layernorm/Mul_1_output_0", "/blocks.24/self_attn/q_proj/FakeLinear_output_0", "/blocks.24/self_attn/Shape_output_0", "Shape3655", "Rank3657", "BinaryOp3659", "Unsqueeze3660", "BinaryOp3662", "Unsqueeze3663", "StridedSlice3666", "Squeeze3667", "BinaryOp3669", "/blocks.24/self_attn/Gather_output_0", "/blocks.24/self_attn/Unsqueeze_output_0", "Unsqueeze3677", "Unsqueeze3680", "StridedSlice3683", "Squeeze3684", "BinaryOp3685", "BinaryOp3686", "/blocks.24/self_attn/Gather_1_output_0", "/blocks.24/self_attn/Unsqueeze_1_output_0", "/blocks.24/self_attn/Concat_output_0", "/blocks.24/self_attn/Reshape_output_0", "/blocks.24/self_attn/q_norm/Cast_output_0", "/blocks.24/self_attn/q_norm/Mul_1_output_0", "/blocks.24/self_attn/Mul_output_0", "/blocks.24/self_attn/Shape_2_output_0", "Shape3701", "Rank3703", "BinaryOp3705", "Unsqueeze3706", "BinaryOp3708", "Unsqueeze3709", "StridedSlice3712", "Squeeze3713", "BinaryOp3714", "BinaryOp3715", "/blocks.24/self_attn/Gather_2_output_0", "/blocks.24/self_attn/Div_output_0", "/blocks.24/self_attn/Unsqueeze_7_output_0", "/blocks.24/self_attn/Slice_1_output_0", "/blocks.24/self_attn/Neg_output_0", "/blocks.24/self_attn/Unsqueeze_6_output_0", "/blocks.24/self_attn/Slice_output_0", "/blocks.24/self_attn/Concat_3_output_0", "/blocks.24/self_attn/Mul_1_output_0", "/blocks.24/self_attn/Add_output_0", "/blocks.24/self_attn/k_proj/FakeLinear_output_0", "/blocks.24/self_attn/Unsqueeze_2_output_0", "/blocks.24/self_attn/Unsqueeze_3_output_0", "/blocks.24/self_attn/Concat_1_output_0", "/blocks.24/self_attn/Reshape_1_output_0", "/blocks.24/self_attn/k_norm/Cast_output_0", "/blocks.24/self_attn/k_norm/Mul_1_output_0", "/blocks.24/self_attn/Mul_2_output_0", "/blocks.24/self_attn/Shape_3_output_0", "Shape3743", "Rank3745", "BinaryOp3747", "Unsqueeze3748", "BinaryOp3750", "Unsqueeze3751", "StridedSlice3754", "Squeeze3755", "BinaryOp3756", "BinaryOp3757", "/blocks.24/self_attn/Gather_3_output_0", "/blocks.24/self_attn/Div_1_output_0", "/blocks.24/self_attn/Unsqueeze_9_output_0", "/blocks.24/self_attn/Slice_3_output_0", "/blocks.24/self_attn/Neg_1_output_0", "/blocks.24/self_attn/Unsqueeze_8_output_0", "/blocks.24/self_attn/Slice_2_output_0", "/blocks.24/self_attn/Concat_4_output_0", "/blocks.24/self_attn/Mul_3_output_0", "/blocks.24/self_attn/Add_1_output_0", "/blocks.24/self_attn/v_proj/FakeLinear_output_0", "/blocks.24/self_attn/Unsqueeze_4_output_0", "/blocks.24/self_attn/Unsqueeze_5_output_0", "/blocks.24/self_attn/Concat_2_output_0", "/blocks.24/self_attn/Reshape_2_output_0", "/blocks.24/self_attn/fused_attn/FusedAttention_output_0", "/blocks.24/self_attn/o_proj/FakeLinear_output_0", "/blocks.24/Add_output_0", "/blocks.24/post_attention_layernorm/Mul_1_output_0", "/blocks.24/mlp/gate_proj/FakeLinear_output_0", "/blocks.24/mlp/act_fn/Mul_output_0", "/blocks.24/mlp/up_proj/FakeLinear_output_0", "/blocks.24/mlp/Mul_output_0", "/blocks.24/mlp/down_proj/FakeLinear_output_0", "/blocks.24/Add_1_output_0", "/blocks.25/Reshape_output_0", "/blocks.25/input_layernorm/Mul_1_output_0", "/blocks.25/self_attn/q_proj/FakeLinear_output_0", "/blocks.25/self_attn/Shape_output_0", "Shape3804", "Rank3806", "BinaryOp3808", "Unsqueeze3809", "BinaryOp3811", "Unsqueeze3812", "StridedSlice3815", "Squeeze3816", "BinaryOp3818", "/blocks.25/self_attn/Gather_output_0", "/blocks.25/self_attn/Unsqueeze_output_0", "Unsqueeze3826", "Unsqueeze3829", "StridedSlice3832", "Squeeze3833", "BinaryOp3834", "BinaryOp3835", "/blocks.25/self_attn/Gather_1_output_0", "/blocks.25/self_attn/Unsqueeze_1_output_0", "/blocks.25/self_attn/Concat_output_0", "/blocks.25/self_attn/Reshape_output_0", "/blocks.25/self_attn/q_norm/Cast_output_0", "/blocks.25/self_attn/q_norm/Mul_1_output_0", "/blocks.25/self_attn/Mul_output_0", "/blocks.25/self_attn/Shape_2_output_0", "Shape3850", "Rank3852", "BinaryOp3854", "Unsqueeze3855", "BinaryOp3857", "Unsqueeze3858", "StridedSlice3861", "Squeeze3862", "BinaryOp3863", "BinaryOp3864", "/blocks.25/self_attn/Gather_2_output_0", "/blocks.25/self_attn/Div_output_0", "/blocks.25/self_attn/Unsqueeze_7_output_0", "/blocks.25/self_attn/Slice_1_output_0", "/blocks.25/self_attn/Neg_output_0", "/blocks.25/self_attn/Unsqueeze_6_output_0", "/blocks.25/self_attn/Slice_output_0", "/blocks.25/self_attn/Concat_3_output_0", "/blocks.25/self_attn/Mul_1_output_0", "/blocks.25/self_attn/Add_output_0", "/blocks.25/self_attn/k_proj/FakeLinear_output_0", "/blocks.25/self_attn/Unsqueeze_2_output_0", "/blocks.25/self_attn/Unsqueeze_3_output_0", "/blocks.25/self_attn/Concat_1_output_0", "/blocks.25/self_attn/Reshape_1_output_0", "/blocks.25/self_attn/k_norm/Cast_output_0", "/blocks.25/self_attn/k_norm/Mul_1_output_0", "/blocks.25/self_attn/Mul_2_output_0", "/blocks.25/self_attn/Shape_3_output_0", "Shape3892", "Rank3894", "BinaryOp3896", "Unsqueeze3897", "BinaryOp3899", "Unsqueeze3900", "StridedSlice3903", "Squeeze3904", "BinaryOp3905", "BinaryOp3906", "/blocks.25/self_attn/Gather_3_output_0", "/blocks.25/self_attn/Div_1_output_0", "/blocks.25/self_attn/Unsqueeze_9_output_0", "/blocks.25/self_attn/Slice_3_output_0", "/blocks.25/self_attn/Neg_1_output_0", "/blocks.25/self_attn/Unsqueeze_8_output_0", "/blocks.25/self_attn/Slice_2_output_0", "/blocks.25/self_attn/Concat_4_output_0", "/blocks.25/self_attn/Mul_3_output_0", "/blocks.25/self_attn/Add_1_output_0", "/blocks.25/self_attn/v_proj/FakeLinear_output_0", "/blocks.25/self_attn/Unsqueeze_4_output_0", "/blocks.25/self_attn/Unsqueeze_5_output_0", "/blocks.25/self_attn/Concat_2_output_0", "/blocks.25/self_attn/Reshape_2_output_0", "/blocks.25/self_attn/fused_attn/FusedAttention_output_0", "/blocks.25/self_attn/o_proj/FakeLinear_output_0", "/blocks.25/Add_output_0", "/blocks.25/post_attention_layernorm/Mul_1_output_0", "/blocks.25/mlp/gate_proj/FakeLinear_output_0", "/blocks.25/mlp/act_fn/Mul_output_0", "/blocks.25/mlp/up_proj/FakeLinear_output_0", "/blocks.25/mlp/Mul_output_0", "/blocks.25/mlp/down_proj/FakeLinear_output_0", "/blocks.25/Add_1_output_0", "/blocks.26/Reshape_output_0", "/blocks.26/input_layernorm/Mul_1_output_0", "/blocks.26/self_attn/q_proj/FakeLinear_output_0", "/blocks.26/self_attn/Shape_output_0", "Shape3953", "Rank3955", "BinaryOp3957", "Unsqueeze3958", "BinaryOp3960", "Unsqueeze3961", "StridedSlice3964", "Squeeze3965", "BinaryOp3967", "/blocks.26/self_attn/Gather_output_0", "/blocks.26/self_attn/Unsqueeze_output_0", "Unsqueeze3975", "Unsqueeze3978", "StridedSlice3981", "Squeeze3982", "BinaryOp3983", "BinaryOp3984", "/blocks.26/self_attn/Gather_1_output_0", "/blocks.26/self_attn/Unsqueeze_1_output_0", "/blocks.26/self_attn/Concat_output_0", "/blocks.26/self_attn/Reshape_output_0", "/blocks.26/self_attn/q_norm/Cast_output_0", "/blocks.26/self_attn/q_norm/Mul_1_output_0", "/blocks.26/self_attn/Mul_output_0", "/blocks.26/self_attn/Shape_2_output_0", "Shape3999", "Rank4001", "BinaryOp4003", "Unsqueeze4004", "BinaryOp4006", "Unsqueeze4007", "StridedSlice4010", "Squeeze4011", "BinaryOp4012", "BinaryOp4013", "/blocks.26/self_attn/Gather_2_output_0", "/blocks.26/self_attn/Div_output_0", "/blocks.26/self_attn/Unsqueeze_7_output_0", "/blocks.26/self_attn/Slice_1_output_0", "/blocks.26/self_attn/Neg_output_0", "/blocks.26/self_attn/Unsqueeze_6_output_0", "/blocks.26/self_attn/Slice_output_0", "/blocks.26/self_attn/Concat_3_output_0", "/blocks.26/self_attn/Mul_1_output_0", "/blocks.26/self_attn/Add_output_0", "/blocks.26/self_attn/k_proj/FakeLinear_output_0", "/blocks.26/self_attn/Unsqueeze_2_output_0", "/blocks.26/self_attn/Unsqueeze_3_output_0", "/blocks.26/self_attn/Concat_1_output_0", "/blocks.26/self_attn/Reshape_1_output_0", "/blocks.26/self_attn/k_norm/Cast_output_0", "/blocks.26/self_attn/k_norm/Mul_1_output_0", "/blocks.26/self_attn/Mul_2_output_0", "/blocks.26/self_attn/Shape_3_output_0", "Shape4041", "Rank4043", "BinaryOp4045", "Unsqueeze4046", "BinaryOp4048", "Unsqueeze4049", "StridedSlice4052", "Squeeze4053", "BinaryOp4054", "BinaryOp4055", "/blocks.26/self_attn/Gather_3_output_0", "/blocks.26/self_attn/Div_1_output_0", "/blocks.26/self_attn/Unsqueeze_9_output_0", "/blocks.26/self_attn/Slice_3_output_0", "/blocks.26/self_attn/Neg_1_output_0", "/blocks.26/self_attn/Unsqueeze_8_output_0", "/blocks.26/self_attn/Slice_2_output_0", "/blocks.26/self_attn/Concat_4_output_0", "/blocks.26/self_attn/Mul_3_output_0", "/blocks.26/self_attn/Add_1_output_0", "/blocks.26/self_attn/v_proj/FakeLinear_output_0", "/blocks.26/self_attn/Unsqueeze_4_output_0", "/blocks.26/self_attn/Unsqueeze_5_output_0", "/blocks.26/self_attn/Concat_2_output_0", "/blocks.26/self_attn/Reshape_2_output_0", "/blocks.26/self_attn/fused_attn/FusedAttention_output_0", "/blocks.26/self_attn/o_proj/FakeLinear_output_0", "/blocks.26/Add_output_0", "/blocks.26/post_attention_layernorm/Mul_1_output_0", "/blocks.26/mlp/gate_proj/FakeLinear_output_0", "/blocks.26/mlp/act_fn/Mul_output_0", "/blocks.26/mlp/up_proj/FakeLinear_output_0", "/blocks.26/mlp/Mul_output_0", "/blocks.26/mlp/down_proj/FakeLinear_output_0", "/blocks.26/Add_1_output_0", "/blocks.27/Reshape_output_0", "/blocks.27/input_layernorm/Mul_1_output_0", "/blocks.27/self_attn/q_proj/FakeLinear_output_0", "/blocks.27/self_attn/Shape_output_0", "Shape4102", "Rank4104", "BinaryOp4106", "Unsqueeze4107", "BinaryOp4109", "Unsqueeze4110", "StridedSlice4113", "Squeeze4114", "BinaryOp4116", "/blocks.27/self_attn/Gather_output_0", "/blocks.27/self_attn/Unsqueeze_output_0", "Unsqueeze4124", "Unsqueeze4127", "StridedSlice4130", "Squeeze4131", "BinaryOp4132", "BinaryOp4133", "/blocks.27/self_attn/Gather_1_output_0", "/blocks.27/self_attn/Unsqueeze_1_output_0", "/blocks.27/self_attn/Concat_output_0", "/blocks.27/self_attn/Reshape_output_0", "/blocks.27/self_attn/q_norm/Cast_output_0", "/blocks.27/self_attn/q_norm/Mul_1_output_0", "/blocks.27/self_attn/Mul_output_0", "/blocks.27/self_attn/Shape_2_output_0", "Shape4148", "Rank4150", "BinaryOp4152", "Unsqueeze4153", "BinaryOp4155", "Unsqueeze4156", "StridedSlice4159", "Squeeze4160", "BinaryOp4161", "BinaryOp4162", "/blocks.27/self_attn/Gather_2_output_0", "/blocks.27/self_attn/Div_output_0", "/blocks.27/self_attn/Unsqueeze_7_output_0", "/blocks.27/self_attn/Slice_1_output_0", "/blocks.27/self_attn/Neg_output_0", "/blocks.27/self_attn/Unsqueeze_6_output_0", "/blocks.27/self_attn/Slice_output_0", "/blocks.27/self_attn/Concat_3_output_0", "/blocks.27/self_attn/Mul_1_output_0", "/blocks.27/self_attn/Add_output_0", "/blocks.27/self_attn/k_proj/FakeLinear_output_0", "/blocks.27/self_attn/Unsqueeze_2_output_0", "/blocks.27/self_attn/Unsqueeze_3_output_0", "/blocks.27/self_attn/Concat_1_output_0", "/blocks.27/self_attn/Reshape_1_output_0", "/blocks.27/self_attn/k_norm/Cast_output_0", "/blocks.27/self_attn/k_norm/Mul_1_output_0", "/blocks.27/self_attn/Mul_2_output_0", "/blocks.27/self_attn/Shape_3_output_0", "Shape4190", "Rank4192", "BinaryOp4194", "Unsqueeze4195", "BinaryOp4197", "Unsqueeze4198", "StridedSlice4201", "Squeeze4202", "BinaryOp4203", "BinaryOp4204", "/blocks.27/self_attn/Gather_3_output_0", "/blocks.27/self_attn/Div_1_output_0", "/blocks.27/self_attn/Unsqueeze_9_output_0", "/blocks.27/self_attn/Slice_3_output_0", "/blocks.27/self_attn/Neg_1_output_0", "/blocks.27/self_attn/Unsqueeze_8_output_0", "/blocks.27/self_attn/Slice_2_output_0", "/blocks.27/self_attn/Concat_4_output_0", "/blocks.27/self_attn/Mul_3_output_0", "/blocks.27/self_attn/Add_1_output_0", "/blocks.27/self_attn/v_proj/FakeLinear_output_0", "/blocks.27/self_attn/Unsqueeze_4_output_0", "/blocks.27/self_attn/Unsqueeze_5_output_0", "/blocks.27/self_attn/Concat_2_output_0", "/blocks.27/self_attn/Reshape_2_output_0", "/blocks.27/self_attn/fused_attn/FusedAttention_output_0", "/blocks.27/self_attn/o_proj/FakeLinear_output_0", "/blocks.27/Add_output_0", "/blocks.27/post_attention_layernorm/Mul_1_output_0", "/blocks.27/mlp/gate_proj/FakeLinear_output_0", "/blocks.27/mlp/act_fn/Mul_output_0", "/blocks.27/mlp/up_proj/FakeLinear_output_0", "/blocks.27/mlp/Mul_output_0", "/blocks.27/mlp/down_proj/FakeLinear_output_0", "/blocks.27/Add_1_output_0", "/Slice_output_0", "hidden_states", "logits", "/layers.0/self_attn/q_proj/Linear/pre_reshape", "/layers.0/self_attn/q_proj/Linear/pre_convert", "/layers.0/self_attn/q_proj/Linear", "/layers.0/self_attn/q_proj/Linear/post_convert", "/layers.0/self_attn/k_proj/Linear/pre_reshape", "/layers.0/self_attn/k_proj/Linear/pre_convert", "/layers.0/self_attn/k_proj/Linear", "/layers.0/self_attn/k_proj/Linear/post_convert", "/layers.0/self_attn/v_proj/Linear/pre_reshape", "/layers.0/self_attn/v_proj/Linear/pre_convert", "/layers.0/self_attn/v_proj/Linear", "/layers.0/self_attn/v_proj/Linear/post_convert", "/layers.0/self_attn/o_proj/Linear/pre_reshape", "/layers.0/self_attn/o_proj/Linear/pre_convert", "/layers.0/self_attn/o_proj/Linear", "/layers.0/self_attn/o_proj/Linear/post_convert", "/layers.0/mlp/gate_proj/Linear/pre_reshape", "/layers.0/mlp/gate_proj/Linear/pre_convert", "/layers.0/mlp/gate_proj/Linear", "/layers.0/mlp/gate_proj/Linear/post_convert", "/layers.0/mlp/up_proj/Linear/pre_reshape", "/layers.0/mlp/up_proj/Linear/pre_convert", "/layers.0/mlp/up_proj/Linear", "/layers.0/mlp/up_proj/Linear/post_convert", "/layers.0/mlp/down_proj/Linear/pre_reshape", "/layers.0/mlp/down_proj/Linear/pre_convert", "/layers.0/mlp/down_proj/Linear", "/layers.0/mlp/down_proj/Linear/post_convert", "/layers.1/self_attn/q_proj/Linear/pre_reshape", "/layers.1/self_attn/q_proj/Linear/pre_convert", "/layers.1/self_attn/q_proj/Linear", "/layers.1/self_attn/q_proj/Linear/post_convert", "/layers.1/self_attn/k_proj/Linear/pre_reshape", "/layers.1/self_attn/k_proj/Linear/pre_convert", "/layers.1/self_attn/k_proj/Linear", "/layers.1/self_attn/k_proj/Linear/post_convert", "/layers.1/self_attn/v_proj/Linear/pre_reshape", "/layers.1/self_attn/v_proj/Linear/pre_convert", "/layers.1/self_attn/v_proj/Linear", "/layers.1/self_attn/v_proj/Linear/post_convert", "/layers.1/self_attn/o_proj/Linear/pre_reshape", "/layers.1/self_attn/o_proj/Linear/pre_convert", "/layers.1/self_attn/o_proj/Linear", "/layers.1/self_attn/o_proj/Linear/post_convert", "/layers.1/mlp/gate_proj/Linear/pre_reshape", "/layers.1/mlp/gate_proj/Linear/pre_convert", "/layers.1/mlp/gate_proj/Linear", "/layers.1/mlp/gate_proj/Linear/post_convert", "/layers.1/mlp/up_proj/Linear/pre_reshape", "/layers.1/mlp/up_proj/Linear/pre_convert", "/layers.1/mlp/up_proj/Linear", "/layers.1/mlp/up_proj/Linear/post_convert", "/layers.1/mlp/down_proj/Linear/pre_reshape", "/layers.1/mlp/down_proj/Linear/pre_convert", "/layers.1/mlp/down_proj/Linear", "/layers.1/mlp/down_proj/Linear/post_convert", "/layers.2/self_attn/q_proj/Linear/pre_reshape", "/layers.2/self_attn/q_proj/Linear/pre_convert", "/layers.2/self_attn/q_proj/Linear", "/layers.2/self_attn/q_proj/Linear/post_convert", "/layers.2/self_attn/k_proj/Linear/pre_reshape", "/layers.2/self_attn/k_proj/Linear/pre_convert", "/layers.2/self_attn/k_proj/Linear", "/layers.2/self_attn/k_proj/Linear/post_convert", "/layers.2/self_attn/v_proj/Linear/pre_reshape", "/layers.2/self_attn/v_proj/Linear/pre_convert", "/layers.2/self_attn/v_proj/Linear", "/layers.2/self_attn/v_proj/Linear/post_convert", "/layers.2/self_attn/o_proj/Linear/pre_reshape", "/layers.2/self_attn/o_proj/Linear/pre_convert", "/layers.2/self_attn/o_proj/Linear", "/layers.2/self_attn/o_proj/Linear/post_convert", "/layers.2/mlp/gate_proj/Linear/pre_reshape", "/layers.2/mlp/gate_proj/Linear/pre_convert", "/layers.2/mlp/gate_proj/Linear", "/layers.2/mlp/gate_proj/Linear/post_convert", "/layers.2/mlp/up_proj/Linear/pre_reshape", "/layers.2/mlp/up_proj/Linear/pre_convert", "/layers.2/mlp/up_proj/Linear", "/layers.2/mlp/up_proj/Linear/post_convert", "/layers.2/mlp/down_proj/Linear/pre_reshape", "/layers.2/mlp/down_proj/Linear/pre_convert", "/layers.2/mlp/down_proj/Linear", "/layers.2/mlp/down_proj/Linear/post_convert", "/layers.3/self_attn/q_proj/Linear/pre_reshape", "/layers.3/self_attn/q_proj/Linear/pre_convert", "/layers.3/self_attn/q_proj/Linear", "/layers.3/self_attn/q_proj/Linear/post_convert", "/layers.3/self_attn/k_proj/Linear/pre_reshape", "/layers.3/self_attn/k_proj/Linear/pre_convert", "/layers.3/self_attn/k_proj/Linear", "/layers.3/self_attn/k_proj/Linear/post_convert", "/layers.3/self_attn/v_proj/Linear/pre_reshape", "/layers.3/self_attn/v_proj/Linear/pre_convert", "/layers.3/self_attn/v_proj/Linear", "/layers.3/self_attn/v_proj/Linear/post_convert", "/layers.3/self_attn/o_proj/Linear/pre_reshape", "/layers.3/self_attn/o_proj/Linear/pre_convert", "/layers.3/self_attn/o_proj/Linear", "/layers.3/self_attn/o_proj/Linear/post_convert", "/layers.3/mlp/gate_proj/Linear/pre_reshape", "/layers.3/mlp/gate_proj/Linear/pre_convert", "/layers.3/mlp/gate_proj/Linear", "/layers.3/mlp/gate_proj/Linear/post_convert", "/layers.3/mlp/up_proj/Linear/pre_reshape", "/layers.3/mlp/up_proj/Linear/pre_convert", "/layers.3/mlp/up_proj/Linear", "/layers.3/mlp/up_proj/Linear/post_convert", "/layers.3/mlp/down_proj/Linear/pre_reshape", "/layers.3/mlp/down_proj/Linear/pre_convert", "/layers.3/mlp/down_proj/Linear", "/layers.3/mlp/down_proj/Linear/post_convert", "/layers.4/self_attn/q_proj/Linear/pre_reshape", "/layers.4/self_attn/q_proj/Linear/pre_convert", "/layers.4/self_attn/q_proj/Linear", "/layers.4/self_attn/q_proj/Linear/post_convert", "/layers.4/self_attn/k_proj/Linear/pre_reshape", "/layers.4/self_attn/k_proj/Linear/pre_convert", "/layers.4/self_attn/k_proj/Linear", "/layers.4/self_attn/k_proj/Linear/post_convert", "/layers.4/self_attn/v_proj/Linear/pre_reshape", "/layers.4/self_attn/v_proj/Linear/pre_convert", "/layers.4/self_attn/v_proj/Linear", "/layers.4/self_attn/v_proj/Linear/post_convert", "/layers.4/self_attn/o_proj/Linear/pre_reshape", "/layers.4/self_attn/o_proj/Linear/pre_convert", "/layers.4/self_attn/o_proj/Linear", "/layers.4/self_attn/o_proj/Linear/post_convert", "/layers.4/mlp/gate_proj/Linear/pre_reshape", "/layers.4/mlp/gate_proj/Linear/pre_convert", "/layers.4/mlp/gate_proj/Linear", "/layers.4/mlp/gate_proj/Linear/post_convert", "/layers.4/mlp/up_proj/Linear/pre_reshape", "/layers.4/mlp/up_proj/Linear/pre_convert", "/layers.4/mlp/up_proj/Linear", "/layers.4/mlp/up_proj/Linear/post_convert", "/layers.4/mlp/down_proj/Linear/pre_reshape", "/layers.4/mlp/down_proj/Linear/pre_convert", "/layers.4/mlp/down_proj/Linear", "/layers.4/mlp/down_proj/Linear/post_convert", "/layers.5/self_attn/q_proj/Linear/pre_reshape", "/layers.5/self_attn/q_proj/Linear/pre_convert", "/layers.5/self_attn/q_proj/Linear", "/layers.5/self_attn/q_proj/Linear/post_convert", "/layers.5/self_attn/k_proj/Linear/pre_reshape", "/layers.5/self_attn/k_proj/Linear/pre_convert", "/layers.5/self_attn/k_proj/Linear", "/layers.5/self_attn/k_proj/Linear/post_convert", "/layers.5/self_attn/v_proj/Linear/pre_reshape", "/layers.5/self_attn/v_proj/Linear/pre_convert", "/layers.5/self_attn/v_proj/Linear", "/layers.5/self_attn/v_proj/Linear/post_convert", "/layers.5/self_attn/o_proj/Linear/pre_reshape", "/layers.5/self_attn/o_proj/Linear/pre_convert", "/layers.5/self_attn/o_proj/Linear", "/layers.5/self_attn/o_proj/Linear/post_convert", "/layers.5/mlp/gate_proj/Linear/pre_reshape", "/layers.5/mlp/gate_proj/Linear/pre_convert", "/layers.5/mlp/gate_proj/Linear", "/layers.5/mlp/gate_proj/Linear/post_convert", "/layers.5/mlp/up_proj/Linear/pre_reshape", "/layers.5/mlp/up_proj/Linear/pre_convert", "/layers.5/mlp/up_proj/Linear", "/layers.5/mlp/up_proj/Linear/post_convert", "/layers.5/mlp/down_proj/Linear/pre_reshape", "/layers.5/mlp/down_proj/Linear/pre_convert", "/layers.5/mlp/down_proj/Linear", "/layers.5/mlp/down_proj/Linear/post_convert", "/layers.6/self_attn/q_proj/Linear/pre_reshape", "/layers.6/self_attn/q_proj/Linear/pre_convert", "/layers.6/self_attn/q_proj/Linear", "/layers.6/self_attn/q_proj/Linear/post_convert", "/layers.6/self_attn/k_proj/Linear/pre_reshape", "/layers.6/self_attn/k_proj/Linear/pre_convert", "/layers.6/self_attn/k_proj/Linear", "/layers.6/self_attn/k_proj/Linear/post_convert", "/layers.6/self_attn/v_proj/Linear/pre_reshape", "/layers.6/self_attn/v_proj/Linear/pre_convert", "/layers.6/self_attn/v_proj/Linear", "/layers.6/self_attn/v_proj/Linear/post_convert", "/layers.6/self_attn/o_proj/Linear/pre_reshape", "/layers.6/self_attn/o_proj/Linear/pre_convert", "/layers.6/self_attn/o_proj/Linear", "/layers.6/self_attn/o_proj/Linear/post_convert", "/layers.6/mlp/gate_proj/Linear/pre_reshape", "/layers.6/mlp/gate_proj/Linear/pre_convert", "/layers.6/mlp/gate_proj/Linear", "/layers.6/mlp/gate_proj/Linear/post_convert", "/layers.6/mlp/up_proj/Linear/pre_reshape", "/layers.6/mlp/up_proj/Linear/pre_convert", "/layers.6/mlp/up_proj/Linear", "/layers.6/mlp/up_proj/Linear/post_convert", "/layers.6/mlp/down_proj/Linear/pre_reshape", "/layers.6/mlp/down_proj/Linear/pre_convert", "/layers.6/mlp/down_proj/Linear", "/layers.6/mlp/down_proj/Linear/post_convert", "/layers.7/self_attn/q_proj/Linear/pre_reshape", "/layers.7/self_attn/q_proj/Linear/pre_convert", "/layers.7/self_attn/q_proj/Linear", "/layers.7/self_attn/q_proj/Linear/post_convert", "/layers.7/self_attn/k_proj/Linear/pre_reshape", "/layers.7/self_attn/k_proj/Linear/pre_convert", "/layers.7/self_attn/k_proj/Linear", "/layers.7/self_attn/k_proj/Linear/post_convert", "/layers.7/self_attn/v_proj/Linear/pre_reshape", "/layers.7/self_attn/v_proj/Linear/pre_convert", "/layers.7/self_attn/v_proj/Linear", "/layers.7/self_attn/v_proj/Linear/post_convert", "/layers.7/self_attn/o_proj/Linear/pre_reshape", "/layers.7/self_attn/o_proj/Linear/pre_convert", "/layers.7/self_attn/o_proj/Linear", "/layers.7/self_attn/o_proj/Linear/post_convert", "/layers.7/mlp/gate_proj/Linear/pre_reshape", "/layers.7/mlp/gate_proj/Linear/pre_convert", "/layers.7/mlp/gate_proj/Linear", "/layers.7/mlp/gate_proj/Linear/post_convert", "/layers.7/mlp/up_proj/Linear/pre_reshape", "/layers.7/mlp/up_proj/Linear/pre_convert", "/layers.7/mlp/up_proj/Linear", "/layers.7/mlp/up_proj/Linear/post_convert", "/layers.7/mlp/down_proj/Linear/pre_reshape", "/layers.7/mlp/down_proj/Linear/pre_convert", "/layers.7/mlp/down_proj/Linear", "/layers.7/mlp/down_proj/Linear/post_convert", "/layers.8/self_attn/q_proj/Linear/pre_reshape", "/layers.8/self_attn/q_proj/Linear/pre_convert", "/layers.8/self_attn/q_proj/Linear", "/layers.8/self_attn/q_proj/Linear/post_convert", "/layers.8/self_attn/k_proj/Linear/pre_reshape", "/layers.8/self_attn/k_proj/Linear/pre_convert", "/layers.8/self_attn/k_proj/Linear", "/layers.8/self_attn/k_proj/Linear/post_convert", "/layers.8/self_attn/v_proj/Linear/pre_reshape", "/layers.8/self_attn/v_proj/Linear/pre_convert", "/layers.8/self_attn/v_proj/Linear", "/layers.8/self_attn/v_proj/Linear/post_convert", "/layers.8/self_attn/o_proj/Linear/pre_reshape", "/layers.8/self_attn/o_proj/Linear/pre_convert", "/layers.8/self_attn/o_proj/Linear", "/layers.8/self_attn/o_proj/Linear/post_convert", "/layers.8/mlp/gate_proj/Linear/pre_reshape", "/layers.8/mlp/gate_proj/Linear/pre_convert", "/layers.8/mlp/gate_proj/Linear", "/layers.8/mlp/gate_proj/Linear/post_convert", "/layers.8/mlp/up_proj/Linear/pre_reshape", "/layers.8/mlp/up_proj/Linear/pre_convert", "/layers.8/mlp/up_proj/Linear", "/layers.8/mlp/up_proj/Linear/post_convert", "/layers.8/mlp/down_proj/Linear/pre_reshape", "/layers.8/mlp/down_proj/Linear/pre_convert", "/layers.8/mlp/down_proj/Linear", "/layers.8/mlp/down_proj/Linear/post_convert", "/layers.9/self_attn/q_proj/Linear/pre_reshape", "/layers.9/self_attn/q_proj/Linear/pre_convert", "/layers.9/self_attn/q_proj/Linear", "/layers.9/self_attn/q_proj/Linear/post_convert", "/layers.9/self_attn/k_proj/Linear/pre_reshape", "/layers.9/self_attn/k_proj/Linear/pre_convert", "/layers.9/self_attn/k_proj/Linear", "/layers.9/self_attn/k_proj/Linear/post_convert", "/layers.9/self_attn/v_proj/Linear/pre_reshape", "/layers.9/self_attn/v_proj/Linear/pre_convert", "/layers.9/self_attn/v_proj/Linear", "/layers.9/self_attn/v_proj/Linear/post_convert", "/layers.9/self_attn/o_proj/Linear/pre_reshape", "/layers.9/self_attn/o_proj/Linear/pre_convert", "/layers.9/self_attn/o_proj/Linear", "/layers.9/self_attn/o_proj/Linear/post_convert", "/layers.9/mlp/gate_proj/Linear/pre_reshape", "/layers.9/mlp/gate_proj/Linear/pre_convert", "/layers.9/mlp/gate_proj/Linear", "/layers.9/mlp/gate_proj/Linear/post_convert", "/layers.9/mlp/up_proj/Linear/pre_reshape", "/layers.9/mlp/up_proj/Linear/pre_convert", "/layers.9/mlp/up_proj/Linear", "/layers.9/mlp/up_proj/Linear/post_convert", "/layers.9/mlp/down_proj/Linear/pre_reshape", "/layers.9/mlp/down_proj/Linear/pre_convert", "/layers.9/mlp/down_proj/Linear", "/layers.9/mlp/down_proj/Linear/post_convert", "/layers.10/self_attn/q_proj/Linear/pre_reshape", "/layers.10/self_attn/q_proj/Linear/pre_convert", "/layers.10/self_attn/q_proj/Linear", "/layers.10/self_attn/q_proj/Linear/post_convert", "/layers.10/self_attn/k_proj/Linear/pre_reshape", "/layers.10/self_attn/k_proj/Linear/pre_convert", "/layers.10/self_attn/k_proj/Linear", "/layers.10/self_attn/k_proj/Linear/post_convert", "/layers.10/self_attn/v_proj/Linear/pre_reshape", "/layers.10/self_attn/v_proj/Linear/pre_convert", "/layers.10/self_attn/v_proj/Linear", "/layers.10/self_attn/v_proj/Linear/post_convert", "/layers.10/self_attn/o_proj/Linear/pre_reshape", "/layers.10/self_attn/o_proj/Linear/pre_convert", "/layers.10/self_attn/o_proj/Linear", "/layers.10/self_attn/o_proj/Linear/post_convert", "/layers.10/mlp/gate_proj/Linear/pre_reshape", "/layers.10/mlp/gate_proj/Linear/pre_convert", "/layers.10/mlp/gate_proj/Linear", "/layers.10/mlp/gate_proj/Linear/post_convert", "/layers.10/mlp/up_proj/Linear/pre_reshape", "/layers.10/mlp/up_proj/Linear/pre_convert", "/layers.10/mlp/up_proj/Linear", "/layers.10/mlp/up_proj/Linear/post_convert", "/layers.10/mlp/down_proj/Linear/pre_reshape", "/layers.10/mlp/down_proj/Linear/pre_convert", "/layers.10/mlp/down_proj/Linear", "/layers.10/mlp/down_proj/Linear/post_convert", "/layers.11/self_attn/q_proj/Linear/pre_reshape", "/layers.11/self_attn/q_proj/Linear/pre_convert", "/layers.11/self_attn/q_proj/Linear", "/layers.11/self_attn/q_proj/Linear/post_convert", "/layers.11/self_attn/k_proj/Linear/pre_reshape", "/layers.11/self_attn/k_proj/Linear/pre_convert", "/layers.11/self_attn/k_proj/Linear", "/layers.11/self_attn/k_proj/Linear/post_convert", "/layers.11/self_attn/v_proj/Linear/pre_reshape", "/layers.11/self_attn/v_proj/Linear/pre_convert", "/layers.11/self_attn/v_proj/Linear", "/layers.11/self_attn/v_proj/Linear/post_convert", "/layers.11/self_attn/o_proj/Linear/pre_reshape", "/layers.11/self_attn/o_proj/Linear/pre_convert", "/layers.11/self_attn/o_proj/Linear", "/layers.11/self_attn/o_proj/Linear/post_convert", "/layers.11/mlp/gate_proj/Linear/pre_reshape", "/layers.11/mlp/gate_proj/Linear/pre_convert", "/layers.11/mlp/gate_proj/Linear", "/layers.11/mlp/gate_proj/Linear/post_convert", "/layers.11/mlp/up_proj/Linear/pre_reshape", "/layers.11/mlp/up_proj/Linear/pre_convert", "/layers.11/mlp/up_proj/Linear", "/layers.11/mlp/up_proj/Linear/post_convert", "/layers.11/mlp/down_proj/Linear/pre_reshape", "/layers.11/mlp/down_proj/Linear/pre_convert", "/layers.11/mlp/down_proj/Linear", "/layers.11/mlp/down_proj/Linear/post_convert", "/layers.12/self_attn/q_proj/Linear/pre_reshape", "/layers.12/self_attn/q_proj/Linear/pre_convert", "/layers.12/self_attn/q_proj/Linear", "/layers.12/self_attn/q_proj/Linear/post_convert", "/layers.12/self_attn/k_proj/Linear/pre_reshape", "/layers.12/self_attn/k_proj/Linear/pre_convert", "/layers.12/self_attn/k_proj/Linear", "/layers.12/self_attn/k_proj/Linear/post_convert", "/layers.12/self_attn/v_proj/Linear/pre_reshape", "/layers.12/self_attn/v_proj/Linear/pre_convert", "/layers.12/self_attn/v_proj/Linear", "/layers.12/self_attn/v_proj/Linear/post_convert", "/layers.12/self_attn/o_proj/Linear/pre_reshape", "/layers.12/self_attn/o_proj/Linear/pre_convert", "/layers.12/self_attn/o_proj/Linear", "/layers.12/self_attn/o_proj/Linear/post_convert", "/layers.12/mlp/gate_proj/Linear/pre_reshape", "/layers.12/mlp/gate_proj/Linear/pre_convert", "/layers.12/mlp/gate_proj/Linear", "/layers.12/mlp/gate_proj/Linear/post_convert", "/layers.12/mlp/up_proj/Linear/pre_reshape", "/layers.12/mlp/up_proj/Linear/pre_convert", "/layers.12/mlp/up_proj/Linear", "/layers.12/mlp/up_proj/Linear/post_convert", "/layers.12/mlp/down_proj/Linear/pre_reshape", "/layers.12/mlp/down_proj/Linear/pre_convert", "/layers.12/mlp/down_proj/Linear", "/layers.12/mlp/down_proj/Linear/post_convert", "/layers.13/self_attn/q_proj/Linear/pre_reshape", "/layers.13/self_attn/q_proj/Linear/pre_convert", "/layers.13/self_attn/q_proj/Linear", "/layers.13/self_attn/q_proj/Linear/post_convert", "/layers.13/self_attn/k_proj/Linear/pre_reshape", "/layers.13/self_attn/k_proj/Linear/pre_convert", "/layers.13/self_attn/k_proj/Linear", "/layers.13/self_attn/k_proj/Linear/post_convert", "/layers.13/self_attn/v_proj/Linear/pre_reshape", "/layers.13/self_attn/v_proj/Linear/pre_convert", "/layers.13/self_attn/v_proj/Linear", "/layers.13/self_attn/v_proj/Linear/post_convert", "/layers.13/self_attn/o_proj/Linear/pre_reshape", "/layers.13/self_attn/o_proj/Linear/pre_convert", "/layers.13/self_attn/o_proj/Linear", "/layers.13/self_attn/o_proj/Linear/post_convert", "/layers.13/mlp/gate_proj/Linear/pre_reshape", "/layers.13/mlp/gate_proj/Linear/pre_convert", "/layers.13/mlp/gate_proj/Linear", "/layers.13/mlp/gate_proj/Linear/post_convert", "/layers.13/mlp/up_proj/Linear/pre_reshape", "/layers.13/mlp/up_proj/Linear/pre_convert", "/layers.13/mlp/up_proj/Linear", "/layers.13/mlp/up_proj/Linear/post_convert", "/layers.13/mlp/down_proj/Linear/pre_reshape", "/layers.13/mlp/down_proj/Linear/pre_convert", "/layers.13/mlp/down_proj/Linear", "/layers.13/mlp/down_proj/Linear/post_convert", "/layers.14/self_attn/q_proj/Linear/pre_reshape", "/layers.14/self_attn/q_proj/Linear/pre_convert", "/layers.14/self_attn/q_proj/Linear", "/layers.14/self_attn/q_proj/Linear/post_convert", "/layers.14/self_attn/k_proj/Linear/pre_reshape", "/layers.14/self_attn/k_proj/Linear/pre_convert", "/layers.14/self_attn/k_proj/Linear", "/layers.14/self_attn/k_proj/Linear/post_convert", "/layers.14/self_attn/v_proj/Linear/pre_reshape", "/layers.14/self_attn/v_proj/Linear/pre_convert", "/layers.14/self_attn/v_proj/Linear", "/layers.14/self_attn/v_proj/Linear/post_convert", "/layers.14/self_attn/o_proj/Linear/pre_reshape", "/layers.14/self_attn/o_proj/Linear/pre_convert", "/layers.14/self_attn/o_proj/Linear", "/layers.14/self_attn/o_proj/Linear/post_convert", "/layers.14/mlp/gate_proj/Linear/pre_reshape", "/layers.14/mlp/gate_proj/Linear/pre_convert", "/layers.14/mlp/gate_proj/Linear", "/layers.14/mlp/gate_proj/Linear/post_convert", "/layers.14/mlp/up_proj/Linear/pre_reshape", "/layers.14/mlp/up_proj/Linear/pre_convert", "/layers.14/mlp/up_proj/Linear", "/layers.14/mlp/up_proj/Linear/post_convert", "/layers.14/mlp/down_proj/Linear/pre_reshape", "/layers.14/mlp/down_proj/Linear/pre_convert", "/layers.14/mlp/down_proj/Linear", "/layers.14/mlp/down_proj/Linear/post_convert", "/layers.15/self_attn/q_proj/Linear/pre_reshape", "/layers.15/self_attn/q_proj/Linear/pre_convert", "/layers.15/self_attn/q_proj/Linear", "/layers.15/self_attn/q_proj/Linear/post_convert", "/layers.15/self_attn/k_proj/Linear/pre_reshape", "/layers.15/self_attn/k_proj/Linear/pre_convert", "/layers.15/self_attn/k_proj/Linear", "/layers.15/self_attn/k_proj/Linear/post_convert", "/layers.15/self_attn/v_proj/Linear/pre_reshape", "/layers.15/self_attn/v_proj/Linear/pre_convert", "/layers.15/self_attn/v_proj/Linear", "/layers.15/self_attn/v_proj/Linear/post_convert", "/layers.15/self_attn/o_proj/Linear/pre_reshape", "/layers.15/self_attn/o_proj/Linear/pre_convert", "/layers.15/self_attn/o_proj/Linear", "/layers.15/self_attn/o_proj/Linear/post_convert", "/layers.15/mlp/gate_proj/Linear/pre_reshape", "/layers.15/mlp/gate_proj/Linear/pre_convert", "/layers.15/mlp/gate_proj/Linear", "/layers.15/mlp/gate_proj/Linear/post_convert", "/layers.15/mlp/up_proj/Linear/pre_reshape", "/layers.15/mlp/up_proj/Linear/pre_convert", "/layers.15/mlp/up_proj/Linear", "/layers.15/mlp/up_proj/Linear/post_convert", "/layers.15/mlp/down_proj/Linear/pre_reshape", "/layers.15/mlp/down_proj/Linear/pre_convert", "/layers.15/mlp/down_proj/Linear", "/layers.15/mlp/down_proj/Linear/post_convert", "/layers.16/self_attn/q_proj/Linear/pre_reshape", "/layers.16/self_attn/q_proj/Linear/pre_convert", "/layers.16/self_attn/q_proj/Linear", "/layers.16/self_attn/q_proj/Linear/post_convert", "/layers.16/self_attn/k_proj/Linear/pre_reshape", "/layers.16/self_attn/k_proj/Linear/pre_convert", "/layers.16/self_attn/k_proj/Linear", "/layers.16/self_attn/k_proj/Linear/post_convert", "/layers.16/self_attn/v_proj/Linear/pre_reshape", "/layers.16/self_attn/v_proj/Linear/pre_convert", "/layers.16/self_attn/v_proj/Linear", "/layers.16/self_attn/v_proj/Linear/post_convert", "/layers.16/self_attn/o_proj/Linear/pre_reshape", "/layers.16/self_attn/o_proj/Linear/pre_convert", "/layers.16/self_attn/o_proj/Linear", "/layers.16/self_attn/o_proj/Linear/post_convert", "/layers.16/mlp/gate_proj/Linear/pre_reshape", "/layers.16/mlp/gate_proj/Linear/pre_convert", "/layers.16/mlp/gate_proj/Linear", "/layers.16/mlp/gate_proj/Linear/post_convert", "/layers.16/mlp/up_proj/Linear/pre_reshape", "/layers.16/mlp/up_proj/Linear/pre_convert", "/layers.16/mlp/up_proj/Linear", "/layers.16/mlp/up_proj/Linear/post_convert", "/layers.16/mlp/down_proj/Linear/pre_reshape", "/layers.16/mlp/down_proj/Linear/pre_convert", "/layers.16/mlp/down_proj/Linear", "/layers.16/mlp/down_proj/Linear/post_convert", "/layers.17/self_attn/q_proj/Linear/pre_reshape", "/layers.17/self_attn/q_proj/Linear/pre_convert", "/layers.17/self_attn/q_proj/Linear", "/layers.17/self_attn/q_proj/Linear/post_convert", "/layers.17/self_attn/k_proj/Linear/pre_reshape", "/layers.17/self_attn/k_proj/Linear/pre_convert", "/layers.17/self_attn/k_proj/Linear", "/layers.17/self_attn/k_proj/Linear/post_convert", "/layers.17/self_attn/v_proj/Linear/pre_reshape", "/layers.17/self_attn/v_proj/Linear/pre_convert", "/layers.17/self_attn/v_proj/Linear", "/layers.17/self_attn/v_proj/Linear/post_convert", "/layers.17/self_attn/o_proj/Linear/pre_reshape", "/layers.17/self_attn/o_proj/Linear/pre_convert", "/layers.17/self_attn/o_proj/Linear", "/layers.17/self_attn/o_proj/Linear/post_convert", "/layers.17/mlp/gate_proj/Linear/pre_reshape", "/layers.17/mlp/gate_proj/Linear/pre_convert", "/layers.17/mlp/gate_proj/Linear", "/layers.17/mlp/gate_proj/Linear/post_convert", "/layers.17/mlp/up_proj/Linear/pre_reshape", "/layers.17/mlp/up_proj/Linear/pre_convert", "/layers.17/mlp/up_proj/Linear", "/layers.17/mlp/up_proj/Linear/post_convert", "/layers.17/mlp/down_proj/Linear/pre_reshape", "/layers.17/mlp/down_proj/Linear/pre_convert", "/layers.17/mlp/down_proj/Linear", "/layers.17/mlp/down_proj/Linear/post_convert", "/layers.18/self_attn/q_proj/Linear/pre_reshape", "/layers.18/self_attn/q_proj/Linear/pre_convert", "/layers.18/self_attn/q_proj/Linear", "/layers.18/self_attn/q_proj/Linear/post_convert", "/layers.18/self_attn/k_proj/Linear/pre_reshape", "/layers.18/self_attn/k_proj/Linear/pre_convert", "/layers.18/self_attn/k_proj/Linear", "/layers.18/self_attn/k_proj/Linear/post_convert", "/layers.18/self_attn/v_proj/Linear/pre_reshape", "/layers.18/self_attn/v_proj/Linear/pre_convert", "/layers.18/self_attn/v_proj/Linear", "/layers.18/self_attn/v_proj/Linear/post_convert", "/layers.18/self_attn/o_proj/Linear/pre_reshape", "/layers.18/self_attn/o_proj/Linear/pre_convert", "/layers.18/self_attn/o_proj/Linear", "/layers.18/self_attn/o_proj/Linear/post_convert", "/layers.18/mlp/gate_proj/Linear/pre_reshape", "/layers.18/mlp/gate_proj/Linear/pre_convert", "/layers.18/mlp/gate_proj/Linear", "/layers.18/mlp/gate_proj/Linear/post_convert", "/layers.18/mlp/up_proj/Linear/pre_reshape", "/layers.18/mlp/up_proj/Linear/pre_convert", "/layers.18/mlp/up_proj/Linear", "/layers.18/mlp/up_proj/Linear/post_convert", "/layers.18/mlp/down_proj/Linear/pre_reshape", "/layers.18/mlp/down_proj/Linear/pre_convert", "/layers.18/mlp/down_proj/Linear", "/layers.18/mlp/down_proj/Linear/post_convert", "/layers.19/self_attn/q_proj/Linear/pre_reshape", "/layers.19/self_attn/q_proj/Linear/pre_convert", "/layers.19/self_attn/q_proj/Linear", "/layers.19/self_attn/q_proj/Linear/post_convert", "/layers.19/self_attn/k_proj/Linear/pre_reshape", "/layers.19/self_attn/k_proj/Linear/pre_convert", "/layers.19/self_attn/k_proj/Linear", "/layers.19/self_attn/k_proj/Linear/post_convert", "/layers.19/self_attn/v_proj/Linear/pre_reshape", "/layers.19/self_attn/v_proj/Linear/pre_convert", "/layers.19/self_attn/v_proj/Linear", "/layers.19/self_attn/v_proj/Linear/post_convert", "/layers.19/self_attn/o_proj/Linear/pre_reshape", "/layers.19/self_attn/o_proj/Linear/pre_convert", "/layers.19/self_attn/o_proj/Linear", "/layers.19/self_attn/o_proj/Linear/post_convert", "/layers.19/mlp/gate_proj/Linear/pre_reshape", "/layers.19/mlp/gate_proj/Linear/pre_convert", "/layers.19/mlp/gate_proj/Linear", "/layers.19/mlp/gate_proj/Linear/post_convert", "/layers.19/mlp/up_proj/Linear/pre_reshape", "/layers.19/mlp/up_proj/Linear/pre_convert", "/layers.19/mlp/up_proj/Linear", "/layers.19/mlp/up_proj/Linear/post_convert", "/layers.19/mlp/down_proj/Linear/pre_reshape", "/layers.19/mlp/down_proj/Linear/pre_convert", "/layers.19/mlp/down_proj/Linear", "/layers.19/mlp/down_proj/Linear/post_convert", "/layers.20/self_attn/q_proj/Linear/pre_reshape", "/layers.20/self_attn/q_proj/Linear/pre_convert", "/layers.20/self_attn/q_proj/Linear", "/layers.20/self_attn/q_proj/Linear/post_convert", "/layers.20/self_attn/k_proj/Linear/pre_reshape", "/layers.20/self_attn/k_proj/Linear/pre_convert", "/layers.20/self_attn/k_proj/Linear", "/layers.20/self_attn/k_proj/Linear/post_convert", "/layers.20/self_attn/v_proj/Linear/pre_reshape", "/layers.20/self_attn/v_proj/Linear/pre_convert", "/layers.20/self_attn/v_proj/Linear", "/layers.20/self_attn/v_proj/Linear/post_convert", "/layers.20/self_attn/o_proj/Linear/pre_reshape", "/layers.20/self_attn/o_proj/Linear/pre_convert", "/layers.20/self_attn/o_proj/Linear", "/layers.20/self_attn/o_proj/Linear/post_convert", "/layers.20/mlp/gate_proj/Linear/pre_reshape", "/layers.20/mlp/gate_proj/Linear/pre_convert", "/layers.20/mlp/gate_proj/Linear", "/layers.20/mlp/gate_proj/Linear/post_convert", "/layers.20/mlp/up_proj/Linear/pre_reshape", "/layers.20/mlp/up_proj/Linear/pre_convert", "/layers.20/mlp/up_proj/Linear", "/layers.20/mlp/up_proj/Linear/post_convert", "/layers.20/mlp/down_proj/Linear/pre_reshape", "/layers.20/mlp/down_proj/Linear/pre_convert", "/layers.20/mlp/down_proj/Linear", "/layers.20/mlp/down_proj/Linear/post_convert", "/layers.21/self_attn/q_proj/Linear/pre_reshape", "/layers.21/self_attn/q_proj/Linear/pre_convert", "/layers.21/self_attn/q_proj/Linear", "/layers.21/self_attn/q_proj/Linear/post_convert", "/layers.21/self_attn/k_proj/Linear/pre_reshape", "/layers.21/self_attn/k_proj/Linear/pre_convert", "/layers.21/self_attn/k_proj/Linear", "/layers.21/self_attn/k_proj/Linear/post_convert", "/layers.21/self_attn/v_proj/Linear/pre_reshape", "/layers.21/self_attn/v_proj/Linear/pre_convert", "/layers.21/self_attn/v_proj/Linear", "/layers.21/self_attn/v_proj/Linear/post_convert", "/layers.21/self_attn/o_proj/Linear/pre_reshape", "/layers.21/self_attn/o_proj/Linear/pre_convert", "/layers.21/self_attn/o_proj/Linear", "/layers.21/self_attn/o_proj/Linear/post_convert", "/layers.21/mlp/gate_proj/Linear/pre_reshape", "/layers.21/mlp/gate_proj/Linear/pre_convert", "/layers.21/mlp/gate_proj/Linear", "/layers.21/mlp/gate_proj/Linear/post_convert", "/layers.21/mlp/up_proj/Linear/pre_reshape", "/layers.21/mlp/up_proj/Linear/pre_convert", "/layers.21/mlp/up_proj/Linear", "/layers.21/mlp/up_proj/Linear/post_convert", "/layers.21/mlp/down_proj/Linear/pre_reshape", "/layers.21/mlp/down_proj/Linear/pre_convert", "/layers.21/mlp/down_proj/Linear", "/layers.21/mlp/down_proj/Linear/post_convert", "/layers.22/self_attn/q_proj/Linear/pre_reshape", "/layers.22/self_attn/q_proj/Linear/pre_convert", "/layers.22/self_attn/q_proj/Linear", "/layers.22/self_attn/q_proj/Linear/post_convert", "/layers.22/self_attn/k_proj/Linear/pre_reshape", "/layers.22/self_attn/k_proj/Linear/pre_convert", "/layers.22/self_attn/k_proj/Linear", "/layers.22/self_attn/k_proj/Linear/post_convert", "/layers.22/self_attn/v_proj/Linear/pre_reshape", "/layers.22/self_attn/v_proj/Linear/pre_convert", "/layers.22/self_attn/v_proj/Linear", "/layers.22/self_attn/v_proj/Linear/post_convert", "/layers.22/self_attn/o_proj/Linear/pre_reshape", "/layers.22/self_attn/o_proj/Linear/pre_convert", "/layers.22/self_attn/o_proj/Linear", "/layers.22/self_attn/o_proj/Linear/post_convert", "/layers.22/mlp/gate_proj/Linear/pre_reshape", "/layers.22/mlp/gate_proj/Linear/pre_convert", "/layers.22/mlp/gate_proj/Linear", "/layers.22/mlp/gate_proj/Linear/post_convert", "/layers.22/mlp/up_proj/Linear/pre_reshape", "/layers.22/mlp/up_proj/Linear/pre_convert", "/layers.22/mlp/up_proj/Linear", "/layers.22/mlp/up_proj/Linear/post_convert", "/layers.22/mlp/down_proj/Linear/pre_reshape", "/layers.22/mlp/down_proj/Linear/pre_convert", "/layers.22/mlp/down_proj/Linear", "/layers.22/mlp/down_proj/Linear/post_convert", "/layers.23/self_attn/q_proj/Linear/pre_reshape", "/layers.23/self_attn/q_proj/Linear/pre_convert", "/layers.23/self_attn/q_proj/Linear", "/layers.23/self_attn/q_proj/Linear/post_convert", "/layers.23/self_attn/k_proj/Linear/pre_reshape", "/layers.23/self_attn/k_proj/Linear/pre_convert", "/layers.23/self_attn/k_proj/Linear", "/layers.23/self_attn/k_proj/Linear/post_convert", "/layers.23/self_attn/v_proj/Linear/pre_reshape", "/layers.23/self_attn/v_proj/Linear/pre_convert", "/layers.23/self_attn/v_proj/Linear", "/layers.23/self_attn/v_proj/Linear/post_convert", "/layers.23/self_attn/o_proj/Linear/pre_reshape", "/layers.23/self_attn/o_proj/Linear/pre_convert", "/layers.23/self_attn/o_proj/Linear", "/layers.23/self_attn/o_proj/Linear/post_convert", "/layers.23/mlp/gate_proj/Linear/pre_reshape", "/layers.23/mlp/gate_proj/Linear/pre_convert", "/layers.23/mlp/gate_proj/Linear", "/layers.23/mlp/gate_proj/Linear/post_convert", "/layers.23/mlp/up_proj/Linear/pre_reshape", "/layers.23/mlp/up_proj/Linear/pre_convert", "/layers.23/mlp/up_proj/Linear", "/layers.23/mlp/up_proj/Linear/post_convert", "/layers.23/mlp/down_proj/Linear/pre_reshape", "/layers.23/mlp/down_proj/Linear/pre_convert", "/layers.23/mlp/down_proj/Linear", "/layers.23/mlp/down_proj/Linear/post_convert", "/layers.24/self_attn/q_proj/Linear/pre_reshape", "/layers.24/self_attn/q_proj/Linear/pre_convert", "/layers.24/self_attn/q_proj/Linear", "/layers.24/self_attn/q_proj/Linear/post_convert", "/layers.24/self_attn/k_proj/Linear/pre_reshape", "/layers.24/self_attn/k_proj/Linear/pre_convert", "/layers.24/self_attn/k_proj/Linear", "/layers.24/self_attn/k_proj/Linear/post_convert", "/layers.24/self_attn/v_proj/Linear/pre_reshape", "/layers.24/self_attn/v_proj/Linear/pre_convert", "/layers.24/self_attn/v_proj/Linear", "/layers.24/self_attn/v_proj/Linear/post_convert", "/layers.24/self_attn/o_proj/Linear/pre_reshape", "/layers.24/self_attn/o_proj/Linear/pre_convert", "/layers.24/self_attn/o_proj/Linear", "/layers.24/self_attn/o_proj/Linear/post_convert", "/layers.24/mlp/gate_proj/Linear/pre_reshape", "/layers.24/mlp/gate_proj/Linear/pre_convert", "/layers.24/mlp/gate_proj/Linear", "/layers.24/mlp/gate_proj/Linear/post_convert", "/layers.24/mlp/up_proj/Linear/pre_reshape", "/layers.24/mlp/up_proj/Linear/pre_convert", "/layers.24/mlp/up_proj/Linear", "/layers.24/mlp/up_proj/Linear/post_convert", "/layers.24/mlp/down_proj/Linear/pre_reshape", "/layers.24/mlp/down_proj/Linear/pre_convert", "/layers.24/mlp/down_proj/Linear", "/layers.24/mlp/down_proj/Linear/post_convert", "/layers.25/self_attn/q_proj/Linear/pre_reshape", "/layers.25/self_attn/q_proj/Linear/pre_convert", "/layers.25/self_attn/q_proj/Linear", "/layers.25/self_attn/q_proj/Linear/post_convert", "/layers.25/self_attn/k_proj/Linear/pre_reshape", "/layers.25/self_attn/k_proj/Linear/pre_convert", "/layers.25/self_attn/k_proj/Linear", "/layers.25/self_attn/k_proj/Linear/post_convert", "/layers.25/self_attn/v_proj/Linear/pre_reshape", "/layers.25/self_attn/v_proj/Linear/pre_convert", "/layers.25/self_attn/v_proj/Linear", "/layers.25/self_attn/v_proj/Linear/post_convert", "/layers.25/self_attn/o_proj/Linear/pre_reshape", "/layers.25/self_attn/o_proj/Linear/pre_convert", "/layers.25/self_attn/o_proj/Linear", "/layers.25/self_attn/o_proj/Linear/post_convert", "/layers.25/mlp/gate_proj/Linear/pre_reshape", "/layers.25/mlp/gate_proj/Linear/pre_convert", "/layers.25/mlp/gate_proj/Linear", "/layers.25/mlp/gate_proj/Linear/post_convert", "/layers.25/mlp/up_proj/Linear/pre_reshape", "/layers.25/mlp/up_proj/Linear/pre_convert", "/layers.25/mlp/up_proj/Linear", "/layers.25/mlp/up_proj/Linear/post_convert", "/layers.25/mlp/down_proj/Linear/pre_reshape", "/layers.25/mlp/down_proj/Linear/pre_convert", "/layers.25/mlp/down_proj/Linear", "/layers.25/mlp/down_proj/Linear/post_convert", "/layers.26/self_attn/q_proj/Linear/pre_reshape", "/layers.26/self_attn/q_proj/Linear/pre_convert", "/layers.26/self_attn/q_proj/Linear", "/layers.26/self_attn/q_proj/Linear/post_convert", "/layers.26/self_attn/k_proj/Linear/pre_reshape", "/layers.26/self_attn/k_proj/Linear/pre_convert", "/layers.26/self_attn/k_proj/Linear", "/layers.26/self_attn/k_proj/Linear/post_convert", "/layers.26/self_attn/v_proj/Linear/pre_reshape", "/layers.26/self_attn/v_proj/Linear/pre_convert", "/layers.26/self_attn/v_proj/Linear", "/layers.26/self_attn/v_proj/Linear/post_convert", "/layers.26/self_attn/o_proj/Linear/pre_reshape", "/layers.26/self_attn/o_proj/Linear/pre_convert", "/layers.26/self_attn/o_proj/Linear", "/layers.26/self_attn/o_proj/Linear/post_convert", "/layers.26/mlp/gate_proj/Linear/pre_reshape", "/layers.26/mlp/gate_proj/Linear/pre_convert", "/layers.26/mlp/gate_proj/Linear", "/layers.26/mlp/gate_proj/Linear/post_convert", "/layers.26/mlp/up_proj/Linear/pre_reshape", "/layers.26/mlp/up_proj/Linear/pre_convert", "/layers.26/mlp/up_proj/Linear", "/layers.26/mlp/up_proj/Linear/post_convert", "/layers.26/mlp/down_proj/Linear/pre_reshape", "/layers.26/mlp/down_proj/Linear/pre_convert", "/layers.26/mlp/down_proj/Linear", "/layers.26/mlp/down_proj/Linear/post_convert", "/layers.27/self_attn/q_proj/Linear/pre_reshape", "/layers.27/self_attn/q_proj/Linear/pre_convert", "/layers.27/self_attn/q_proj/Linear", "/layers.27/self_attn/q_proj/Linear/post_convert", "/layers.27/self_attn/k_proj/Linear/pre_reshape", "/layers.27/self_attn/k_proj/Linear/pre_convert", "/layers.27/self_attn/k_proj/Linear", "/layers.27/self_attn/k_proj/Linear/post_convert", "/layers.27/self_attn/v_proj/Linear/pre_reshape", "/layers.27/self_attn/v_proj/Linear/pre_convert", "/layers.27/self_attn/v_proj/Linear", "/layers.27/self_attn/v_proj/Linear/post_convert", "/layers.27/self_attn/o_proj/Linear/pre_reshape", "/layers.27/self_attn/o_proj/Linear/pre_convert", "/layers.27/self_attn/o_proj/Linear", "/layers.27/self_attn/o_proj/Linear/post_convert", "/layers.27/mlp/gate_proj/Linear/pre_reshape", "/layers.27/mlp/gate_proj/Linear/pre_convert", "/layers.27/mlp/gate_proj/Linear", "/layers.27/mlp/gate_proj/Linear/post_convert", "/layers.27/mlp/up_proj/Linear/pre_reshape", "/layers.27/mlp/up_proj/Linear/pre_convert", "/layers.27/mlp/up_proj/Linear", "/layers.27/mlp/up_proj/Linear/post_convert", "/layers.27/mlp/down_proj/Linear/pre_reshape", "/layers.27/mlp/down_proj/Linear/pre_convert", "/layers.27/mlp/down_proj/Linear", "/layers.27/mlp/down_proj/Linear/post_convert", "/lm/lm_head/Linear/pre_reshape", "/lm/lm_head/Linear/pre_convert", "/lm/lm_head/Linear", "/lm/lm_head/Linear/post_convert" ] , "tensorNumber": 0, "usage": "INFERENCE", "mnn_uuid": "623efb03-4a9b-4840-b815-841594394369" }