segmind-vega-amdnpu / vae_encoder /dd /cache /NhwcConv_0-encoderconv_inConv_meta.json
bconsolvo's picture
vae encoder
75bb598
{
"dd_meta_major_version": 1,
"dd_meta_minor_version": 4,
"state_table_updates": [],
"op_list": [
{
"name": "NhwcConv_0-/encoder/conv_in/Conv",
"type": "SDConv",
"in_args": [
"Transpose_0_out-init_image.out2_3_0"
],
"const_args": [
"NhwcConv_0_weight_NHWC"
],
"out_args": [
"NhwcConv_0_out-/encoder/conv_in/Conv_output_0.out2_3_0"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"4"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"weight_shape": {
"type": "int",
"value": [
"128",
"3",
"3",
"4"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_0",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_0_out-/encoder/conv_in/Conv_output_0.out2_3_0"
],
"const_args": [
"GroupNorm_0_wts_6_0_0"
],
"out_args": [
"GroupNorm_0.out12_0.out6_0_0"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"wts_shape": {
"type": "int",
"value": [
"256"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"128"
]
},
"beta_shape": {
"type": "int",
"value": [
"128"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_1-/encoder/down_blocks.0/resnets.0/conv1/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_0.out12_0.out6_0_0"
],
"const_args": [
"NhwcConv_1_weight_NHWC"
],
"out_args": [
"NhwcConv_1_out-/encoder/down_blocks.0/resnets.0/conv1/Conv_output_0.out2_3_1"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"weight_shape": {
"type": "int",
"value": [
"128",
"3",
"3",
"128"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_1",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_1_out-/encoder/down_blocks.0/resnets.0/conv1/Conv_output_0.out2_3_1"
],
"const_args": [
"GroupNorm_1_wts_6_0_1"
],
"out_args": [
"GroupNorm_1.out12_1.out6_0_1"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"wts_shape": {
"type": "int",
"value": [
"256"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"128"
]
},
"beta_shape": {
"type": "int",
"value": [
"128"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_2-/encoder/down_blocks.0/resnets.0/conv2/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_1.out12_1.out6_0_1"
],
"const_args": [
"NhwcConv_2_weight_NHWC"
],
"out_args": [
"NhwcConv_2_out-/encoder/down_blocks.0/resnets.0/conv2/Conv_output_0.out2_3_2"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"weight_shape": {
"type": "int",
"value": [
"128",
"3",
"3",
"128"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "/encoder/down_blocks.0/resnets.0/Add",
"type": "SDAdd",
"in_args": [
"NhwcConv_0_out-/encoder/conv_in/Conv_output_0.out2_3_0",
"NhwcConv_2_out-/encoder/down_blocks.0/resnets.0/conv2/Conv_output_0.out2_3_2"
],
"const_args": [],
"out_args": [
"/encoder/down_blocks.0/resnets.0/Add.out_4_1_0"
],
"attrs": {
"a_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"b_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"c_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"is_bias_add": {
"type": "int",
"value": [
"0"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "GroupNorm_2",
"type": "SDGroupNorm",
"in_args": [
"/encoder/down_blocks.0/resnets.0/Add.out_4_1_0"
],
"const_args": [
"GroupNorm_2_wts_6_0_2"
],
"out_args": [
"GroupNorm_2.out12_2.out6_0_2"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"wts_shape": {
"type": "int",
"value": [
"256"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"128"
]
},
"beta_shape": {
"type": "int",
"value": [
"128"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_3-/encoder/down_blocks.0/resnets.1/conv1/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_2.out12_2.out6_0_2"
],
"const_args": [
"NhwcConv_3_weight_NHWC"
],
"out_args": [
"NhwcConv_3_out-/encoder/down_blocks.0/resnets.1/conv1/Conv_output_0.out2_3_3"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"weight_shape": {
"type": "int",
"value": [
"128",
"3",
"3",
"128"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_3",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_3_out-/encoder/down_blocks.0/resnets.1/conv1/Conv_output_0.out2_3_3"
],
"const_args": [
"GroupNorm_3_wts_6_0_3"
],
"out_args": [
"GroupNorm_3.out12_3.out6_0_3"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"wts_shape": {
"type": "int",
"value": [
"256"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"128"
]
},
"beta_shape": {
"type": "int",
"value": [
"128"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_4-/encoder/down_blocks.0/resnets.1/conv2/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_3.out12_3.out6_0_3"
],
"const_args": [
"NhwcConv_4_weight_NHWC"
],
"out_args": [
"NhwcConv_4_out-/encoder/down_blocks.0/resnets.1/conv2/Conv_output_0.out2_3_4"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"weight_shape": {
"type": "int",
"value": [
"128",
"3",
"3",
"128"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "/encoder/down_blocks.0/resnets.1/Add",
"type": "SDAdd",
"in_args": [
"/encoder/down_blocks.0/resnets.0/Add.out_4_1_0",
"NhwcConv_4_out-/encoder/down_blocks.0/resnets.1/conv2/Conv_output_0.out2_3_4"
],
"const_args": [],
"out_args": [
"/encoder/down_blocks.0/resnets.1/Add.out_4_1_1"
],
"attrs": {
"a_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"b_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"c_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"is_bias_add": {
"type": "int",
"value": [
"0"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_5-/encoder/down_blocks.0/downsamplers.0/conv/Conv",
"type": "SDConv",
"in_args": [
"/encoder/down_blocks.0/resnets.1/Add.out_4_1_1"
],
"const_args": [
"NhwcConv_5_weight_NHWC"
],
"out_args": [
"NhwcConv_5_out-/encoder/down_blocks.0/downsamplers.0/conv/Conv_output_0.out2_3_5"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"strides": {
"type": "int",
"value": [
"2",
"2"
]
},
"pads": {
"type": "int",
"value": [
"0",
"0",
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"1024",
"1024",
"128"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"128"
]
},
"weight_shape": {
"type": "int",
"value": [
"128",
"3",
"3",
"128"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_4",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_5_out-/encoder/down_blocks.0/downsamplers.0/conv/Conv_output_0.out2_3_5"
],
"const_args": [
"GroupNorm_4_wts_6_0_4"
],
"out_args": [
"GroupNorm_4.out12_4.out6_0_4"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"128"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"128"
]
},
"wts_shape": {
"type": "int",
"value": [
"256"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"128"
]
},
"beta_shape": {
"type": "int",
"value": [
"128"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_6-/encoder/down_blocks.1/resnets.0/conv_shortcut/Conv",
"type": "SDConv",
"in_args": [
"NhwcConv_5_out-/encoder/down_blocks.0/downsamplers.0/conv/Conv_output_0.out2_3_5"
],
"const_args": [
"NhwcConv_6_weight_NHWC"
],
"out_args": [
"NhwcConv_6_out-/encoder/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out2_3_6"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"1",
"1"
]
},
"pads": {
"type": "int",
"value": [
"0",
"0",
"0",
"0"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"128"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"weight_shape": {
"type": "int",
"value": [
"256",
"1",
"1",
"128"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "NhwcConv_7-/encoder/down_blocks.1/resnets.0/conv1/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_4.out12_4.out6_0_4"
],
"const_args": [
"NhwcConv_7_weight_NHWC"
],
"out_args": [
"NhwcConv_7_out-/encoder/down_blocks.1/resnets.0/conv1/Conv_output_0.out2_3_7"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"128"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"weight_shape": {
"type": "int",
"value": [
"256",
"3",
"3",
"128"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_5",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_7_out-/encoder/down_blocks.1/resnets.0/conv1/Conv_output_0.out2_3_7"
],
"const_args": [
"GroupNorm_5_wts_6_0_5"
],
"out_args": [
"GroupNorm_5.out12_5.out6_0_5"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"wts_shape": {
"type": "int",
"value": [
"512"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"256"
]
},
"beta_shape": {
"type": "int",
"value": [
"256"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_8-/encoder/down_blocks.1/resnets.0/conv2/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_5.out12_5.out6_0_5"
],
"const_args": [
"NhwcConv_8_weight_NHWC"
],
"out_args": [
"NhwcConv_8_out-/encoder/down_blocks.1/resnets.0/conv2/Conv_output_0.out2_3_8"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"weight_shape": {
"type": "int",
"value": [
"256",
"3",
"3",
"256"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "/encoder/down_blocks.1/resnets.0/Add",
"type": "SDAdd",
"in_args": [
"NhwcConv_6_out-/encoder/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out2_3_6",
"NhwcConv_8_out-/encoder/down_blocks.1/resnets.0/conv2/Conv_output_0.out2_3_8"
],
"const_args": [],
"out_args": [
"/encoder/down_blocks.1/resnets.0/Add.out_4_1_2"
],
"attrs": {
"a_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"b_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"c_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"is_bias_add": {
"type": "int",
"value": [
"0"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "GroupNorm_6",
"type": "SDGroupNorm",
"in_args": [
"/encoder/down_blocks.1/resnets.0/Add.out_4_1_2"
],
"const_args": [
"GroupNorm_6_wts_6_0_6"
],
"out_args": [
"GroupNorm_6.out12_6.out6_0_6"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"wts_shape": {
"type": "int",
"value": [
"512"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"256"
]
},
"beta_shape": {
"type": "int",
"value": [
"256"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_9-/encoder/down_blocks.1/resnets.1/conv1/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_6.out12_6.out6_0_6"
],
"const_args": [
"NhwcConv_9_weight_NHWC"
],
"out_args": [
"NhwcConv_9_out-/encoder/down_blocks.1/resnets.1/conv1/Conv_output_0.out2_3_9"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"weight_shape": {
"type": "int",
"value": [
"256",
"3",
"3",
"256"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_7",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_9_out-/encoder/down_blocks.1/resnets.1/conv1/Conv_output_0.out2_3_9"
],
"const_args": [
"GroupNorm_7_wts_6_0_7"
],
"out_args": [
"GroupNorm_7.out12_7.out6_0_7"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"wts_shape": {
"type": "int",
"value": [
"512"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"256"
]
},
"beta_shape": {
"type": "int",
"value": [
"256"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_10-/encoder/down_blocks.1/resnets.1/conv2/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_7.out12_7.out6_0_7"
],
"const_args": [
"NhwcConv_10_weight_NHWC"
],
"out_args": [
"NhwcConv_10_out-/encoder/down_blocks.1/resnets.1/conv2/Conv_output_0.out2_3_10"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"weight_shape": {
"type": "int",
"value": [
"256",
"3",
"3",
"256"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "/encoder/down_blocks.1/resnets.1/Add",
"type": "SDAdd",
"in_args": [
"/encoder/down_blocks.1/resnets.0/Add.out_4_1_2",
"NhwcConv_10_out-/encoder/down_blocks.1/resnets.1/conv2/Conv_output_0.out2_3_10"
],
"const_args": [],
"out_args": [
"/encoder/down_blocks.1/resnets.1/Add.out_4_1_3"
],
"attrs": {
"a_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"b_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"c_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"is_bias_add": {
"type": "int",
"value": [
"0"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_11-/encoder/down_blocks.1/downsamplers.0/conv/Conv",
"type": "SDConv",
"in_args": [
"/encoder/down_blocks.1/resnets.1/Add.out_4_1_3"
],
"const_args": [
"NhwcConv_11_weight_NHWC"
],
"out_args": [
"NhwcConv_11_out-/encoder/down_blocks.1/downsamplers.0/conv/Conv_output_0.out2_3_11"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"strides": {
"type": "int",
"value": [
"2",
"2"
]
},
"pads": {
"type": "int",
"value": [
"0",
"0",
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"512",
"512",
"256"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"256"
]
},
"weight_shape": {
"type": "int",
"value": [
"256",
"3",
"3",
"256"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_8",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_11_out-/encoder/down_blocks.1/downsamplers.0/conv/Conv_output_0.out2_3_11"
],
"const_args": [
"GroupNorm_8_wts_6_0_8"
],
"out_args": [
"GroupNorm_8.out12_8.out6_0_8"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"256"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"256"
]
},
"wts_shape": {
"type": "int",
"value": [
"512"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"256"
]
},
"beta_shape": {
"type": "int",
"value": [
"256"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_12-/encoder/down_blocks.2/resnets.0/conv_shortcut/Conv",
"type": "SDConv",
"in_args": [
"NhwcConv_11_out-/encoder/down_blocks.1/downsamplers.0/conv/Conv_output_0.out2_3_11"
],
"const_args": [
"NhwcConv_12_weight_NHWC"
],
"out_args": [
"NhwcConv_12_out-/encoder/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out2_3_12"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"1",
"1"
]
},
"pads": {
"type": "int",
"value": [
"0",
"0",
"0",
"0"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"256"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"1",
"1",
"256"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "NhwcConv_13-/encoder/down_blocks.2/resnets.0/conv1/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_8.out12_8.out6_0_8"
],
"const_args": [
"NhwcConv_13_weight_NHWC"
],
"out_args": [
"NhwcConv_13_out-/encoder/down_blocks.2/resnets.0/conv1/Conv_output_0.out2_3_13"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"256"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"3",
"3",
"256"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_9",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_13_out-/encoder/down_blocks.2/resnets.0/conv1/Conv_output_0.out2_3_13"
],
"const_args": [
"GroupNorm_9_wts_6_0_9"
],
"out_args": [
"GroupNorm_9.out12_9.out6_0_9"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"wts_shape": {
"type": "int",
"value": [
"1024"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"512"
]
},
"beta_shape": {
"type": "int",
"value": [
"512"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_14-/encoder/down_blocks.2/resnets.0/conv2/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_9.out12_9.out6_0_9"
],
"const_args": [
"NhwcConv_14_weight_NHWC"
],
"out_args": [
"NhwcConv_14_out-/encoder/down_blocks.2/resnets.0/conv2/Conv_output_0.out2_3_14"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"3",
"3",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "/encoder/down_blocks.2/resnets.0/Add",
"type": "SDAdd",
"in_args": [
"NhwcConv_12_out-/encoder/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out2_3_12",
"NhwcConv_14_out-/encoder/down_blocks.2/resnets.0/conv2/Conv_output_0.out2_3_14"
],
"const_args": [],
"out_args": [
"/encoder/down_blocks.2/resnets.0/Add.out_4_1_4"
],
"attrs": {
"a_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"b_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"c_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"is_bias_add": {
"type": "int",
"value": [
"0"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "GroupNorm_10",
"type": "SDGroupNorm",
"in_args": [
"/encoder/down_blocks.2/resnets.0/Add.out_4_1_4"
],
"const_args": [
"GroupNorm_10_wts_6_0_10"
],
"out_args": [
"GroupNorm_10.out12_10.out6_0_10"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"wts_shape": {
"type": "int",
"value": [
"1024"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"512"
]
},
"beta_shape": {
"type": "int",
"value": [
"512"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_15-/encoder/down_blocks.2/resnets.1/conv1/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_10.out12_10.out6_0_10"
],
"const_args": [
"NhwcConv_15_weight_NHWC"
],
"out_args": [
"NhwcConv_15_out-/encoder/down_blocks.2/resnets.1/conv1/Conv_output_0.out2_3_15"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"3",
"3",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_11",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_15_out-/encoder/down_blocks.2/resnets.1/conv1/Conv_output_0.out2_3_15"
],
"const_args": [
"GroupNorm_11_wts_6_0_11"
],
"out_args": [
"GroupNorm_11.out12_11.out6_0_11"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"wts_shape": {
"type": "int",
"value": [
"1024"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"512"
]
},
"beta_shape": {
"type": "int",
"value": [
"512"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_16-/encoder/down_blocks.2/resnets.1/conv2/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_11.out12_11.out6_0_11"
],
"const_args": [
"NhwcConv_16_weight_NHWC"
],
"out_args": [
"NhwcConv_16_out-/encoder/down_blocks.2/resnets.1/conv2/Conv_output_0.out2_3_16"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"3",
"3",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "/encoder/down_blocks.2/resnets.1/Add",
"type": "SDAdd",
"in_args": [
"/encoder/down_blocks.2/resnets.0/Add.out_4_1_4",
"NhwcConv_16_out-/encoder/down_blocks.2/resnets.1/conv2/Conv_output_0.out2_3_16"
],
"const_args": [],
"out_args": [
"/encoder/down_blocks.2/resnets.1/Add.out_4_1_5"
],
"attrs": {
"a_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"b_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"c_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"is_bias_add": {
"type": "int",
"value": [
"0"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_17-/encoder/down_blocks.2/downsamplers.0/conv/Conv",
"type": "SDConv",
"in_args": [
"/encoder/down_blocks.2/resnets.1/Add.out_4_1_5"
],
"const_args": [
"NhwcConv_17_weight_NHWC"
],
"out_args": [
"NhwcConv_17_out-/encoder/down_blocks.2/downsamplers.0/conv/Conv_output_0.out2_3_17"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"strides": {
"type": "int",
"value": [
"2",
"2"
]
},
"pads": {
"type": "int",
"value": [
"0",
"0",
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"256",
"256",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"3",
"3",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_12",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_17_out-/encoder/down_blocks.2/downsamplers.0/conv/Conv_output_0.out2_3_17"
],
"const_args": [
"GroupNorm_12_wts_6_0_12"
],
"out_args": [
"GroupNorm_12.out12_12.out6_0_12"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"wts_shape": {
"type": "int",
"value": [
"1024"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"512"
]
},
"beta_shape": {
"type": "int",
"value": [
"512"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_18-/encoder/down_blocks.3/resnets.0/conv1/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_12.out12_12.out6_0_12"
],
"const_args": [
"NhwcConv_18_weight_NHWC"
],
"out_args": [
"NhwcConv_18_out-/encoder/down_blocks.3/resnets.0/conv1/Conv_output_0.out2_3_18"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"3",
"3",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_13",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_18_out-/encoder/down_blocks.3/resnets.0/conv1/Conv_output_0.out2_3_18"
],
"const_args": [
"GroupNorm_13_wts_6_0_13"
],
"out_args": [
"GroupNorm_13.out12_13.out6_0_13"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"wts_shape": {
"type": "int",
"value": [
"1024"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"512"
]
},
"beta_shape": {
"type": "int",
"value": [
"512"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_19-/encoder/down_blocks.3/resnets.0/conv2/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_13.out12_13.out6_0_13"
],
"const_args": [
"NhwcConv_19_weight_NHWC"
],
"out_args": [
"NhwcConv_19_out-/encoder/down_blocks.3/resnets.0/conv2/Conv_output_0.out2_3_19"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"3",
"3",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "/encoder/down_blocks.3/resnets.0/Add",
"type": "SDAdd",
"in_args": [
"NhwcConv_17_out-/encoder/down_blocks.2/downsamplers.0/conv/Conv_output_0.out2_3_17",
"NhwcConv_19_out-/encoder/down_blocks.3/resnets.0/conv2/Conv_output_0.out2_3_19"
],
"const_args": [],
"out_args": [
"/encoder/down_blocks.3/resnets.0/Add.out_4_1_6"
],
"attrs": {
"a_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"b_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"c_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"is_bias_add": {
"type": "int",
"value": [
"0"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "GroupNorm_14",
"type": "SDGroupNorm",
"in_args": [
"/encoder/down_blocks.3/resnets.0/Add.out_4_1_6"
],
"const_args": [
"GroupNorm_14_wts_6_0_14"
],
"out_args": [
"GroupNorm_14.out12_14.out6_0_14"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"wts_shape": {
"type": "int",
"value": [
"1024"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"512"
]
},
"beta_shape": {
"type": "int",
"value": [
"512"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_20-/encoder/down_blocks.3/resnets.1/conv1/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_14.out12_14.out6_0_14"
],
"const_args": [
"NhwcConv_20_weight_NHWC"
],
"out_args": [
"NhwcConv_20_out-/encoder/down_blocks.3/resnets.1/conv1/Conv_output_0.out2_3_20"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"3",
"3",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_15",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_20_out-/encoder/down_blocks.3/resnets.1/conv1/Conv_output_0.out2_3_20"
],
"const_args": [
"GroupNorm_15_wts_6_0_15"
],
"out_args": [
"GroupNorm_15.out12_15.out6_0_15"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"wts_shape": {
"type": "int",
"value": [
"1024"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"512"
]
},
"beta_shape": {
"type": "int",
"value": [
"512"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_21-/encoder/down_blocks.3/resnets.1/conv2/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_15.out12_15.out6_0_15"
],
"const_args": [
"NhwcConv_21_weight_NHWC"
],
"out_args": [
"NhwcConv_21_out-/encoder/down_blocks.3/resnets.1/conv2/Conv_output_0.out2_3_21"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"3",
"3",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "/encoder/down_blocks.3/resnets.1/Add",
"type": "SDAdd",
"in_args": [
"/encoder/down_blocks.3/resnets.0/Add.out_4_1_6",
"NhwcConv_21_out-/encoder/down_blocks.3/resnets.1/conv2/Conv_output_0.out2_3_21"
],
"const_args": [],
"out_args": [
"/encoder/down_blocks.3/resnets.1/Add.out_4_1_7"
],
"attrs": {
"a_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"b_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"c_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"is_bias_add": {
"type": "int",
"value": [
"0"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "GroupNorm_16",
"type": "SDGroupNorm",
"in_args": [
"/encoder/down_blocks.3/resnets.1/Add.out_4_1_7"
],
"const_args": [
"GroupNorm_16_wts_6_0_16"
],
"out_args": [
"GroupNorm_16.out12_16.out6_0_16"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"wts_shape": {
"type": "int",
"value": [
"1024"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"512"
]
},
"beta_shape": {
"type": "int",
"value": [
"512"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_22-/encoder/mid_block/resnets.0/conv1/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_16.out12_16.out6_0_16"
],
"const_args": [
"NhwcConv_22_weight_NHWC"
],
"out_args": [
"NhwcConv_22_out-/encoder/mid_block/resnets.0/conv1/Conv_output_0.out2_3_22"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"3",
"3",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_17",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_22_out-/encoder/mid_block/resnets.0/conv1/Conv_output_0.out2_3_22"
],
"const_args": [
"GroupNorm_17_wts_6_0_17"
],
"out_args": [
"GroupNorm_17.out12_17.out6_0_17"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"wts_shape": {
"type": "int",
"value": [
"1024"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"512"
]
},
"beta_shape": {
"type": "int",
"value": [
"512"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_23-/encoder/mid_block/resnets.0/conv2/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_17.out12_17.out6_0_17"
],
"const_args": [
"NhwcConv_23_weight_NHWC"
],
"out_args": [
"NhwcConv_23_out-/encoder/mid_block/resnets.0/conv2/Conv_output_0.out2_3_23"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"3",
"3",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "/encoder/mid_block/resnets.0/Add",
"type": "SDAdd",
"in_args": [
"/encoder/down_blocks.3/resnets.1/Add.out_4_1_7",
"NhwcConv_23_out-/encoder/mid_block/resnets.0/conv2/Conv_output_0.out2_3_23"
],
"const_args": [],
"out_args": [
"/encoder/mid_block/resnets.0/Add.out_4_1_8"
],
"attrs": {
"a_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"b_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"c_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"is_bias_add": {
"type": "int",
"value": [
"0"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "GroupNorm_18",
"type": "SDGroupNorm",
"in_args": [
"/encoder/mid_block/resnets.0/Add.out_4_1_8"
],
"const_args": [
"GroupNorm_18_wts_6_1_0"
],
"out_args": [
"/encoder/mid_block/attentions.0/group_norm/Add_output_0_4d_NHWC.out6_1_0"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"wts_shape": {
"type": "int",
"value": [
"1024"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"512"
]
},
"beta_shape": {
"type": "int",
"value": [
"512"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "/encoder/mid_block/attentions.0/to_k/MatMul/MatMulAddFusion",
"type": "SDGemm",
"in_args": [
"/encoder/mid_block/attentions.0/group_norm/Add_output_0_4d_NHWC.out6_1_0"
],
"const_args": [
"onnx::MatMul_890_2_0_0"
],
"out_args": [
"/encoder/mid_block/attentions.0/Reshape_2_output_0_3d.out3_3_0"
],
"attrs": {
"input_shape": {
"type": "int",
"value": [
"1",
"16384",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"16384",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"bias_enable": {
"type": "int",
"value": [
"1"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"bfloat16"
]
}
}
},
{
"name": "/encoder/mid_block/attentions.0/to_q/MatMul/MatMulAddFusion",
"type": "SDGemm",
"in_args": [
"/encoder/mid_block/attentions.0/group_norm/Add_output_0_4d_NHWC.out6_1_0"
],
"const_args": [
"onnx::MatMul_889_2_0_1"
],
"out_args": [
"/encoder/mid_block/attentions.0/Reshape_1_output_0_3d.out3_3_1"
],
"attrs": {
"input_shape": {
"type": "int",
"value": [
"1",
"16384",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"16384",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"bias_enable": {
"type": "int",
"value": [
"1"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"bfloat16"
]
}
}
},
{
"name": "/encoder/mid_block/attentions.0/to_v/MatMul/MatMulAddFusion",
"type": "SDGemm",
"in_args": [
"/encoder/mid_block/attentions.0/group_norm/Add_output_0_4d_NHWC.out6_1_0"
],
"const_args": [
"onnx::MatMul_891_2_0_2"
],
"out_args": [
"/encoder/mid_block/attentions.0/Reshape_3_output_0_3d.out3_3_2"
],
"attrs": {
"input_shape": {
"type": "int",
"value": [
"1",
"16384",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"16384",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"bias_enable": {
"type": "int",
"value": [
"1"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"bfloat16"
]
}
}
},
{
"name": "/encoder/mid_block/attentions.0/MatMul/MatMulScaleFusion/_FusedActivationmha_3_1_0",
"type": "SDMHA_VAE",
"in_args": [
"/encoder/mid_block/attentions.0/Reshape_1_output_0_3d.out3_3_1",
"/encoder/mid_block/attentions.0/Reshape_2_output_0_3d.out3_3_0",
"/encoder/mid_block/attentions.0/Reshape_3_output_0_3d.out3_3_2"
],
"const_args": [
"/encoder/mid_block/attentions.0/MatMul/MatMulScaleFusion/_FusedActivationmha_3_1_0_mask.12_0"
],
"out_args": [
"/encoder/mid_block/attentions.0/Transpose_5_output_0_3d.out12_0"
],
"attrs": {
"num_heads": {
"type": "int",
"value": [
"1"
]
},
"unidirectional": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"16384",
"512",
"16384"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"op_version": {
"type": "str",
"value": [
"v1.0"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "/encoder/mid_block/attentions.0/to_out.0/MatMul/MatMulAddFusion",
"type": "SDGemm",
"in_args": [
"/encoder/mid_block/attentions.0/Transpose_5_output_0_3d.out12_0"
],
"const_args": [
"onnx::MatMul_899_2_0_3"
],
"out_args": [
"/encoder/mid_block/attentions.0/Reshape_5_output_0.nhwc6_0.out3_0_0"
],
"attrs": {
"input_shape": {
"type": "int",
"value": [
"1",
"16384",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"16384",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"bias_enable": {
"type": "int",
"value": [
"1"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"bfloat16"
]
}
}
},
{
"name": "/encoder/mid_block/attentions.0/Add",
"type": "SDAdd",
"in_args": [
"/encoder/mid_block/attentions.0/Reshape_5_output_0.nhwc6_0.out3_0_0",
"/encoder/mid_block/resnets.0/Add.out_4_1_8"
],
"const_args": [],
"out_args": [
"/encoder/mid_block/attentions.0/Add_output_0_NHWC.out_4_1_9"
],
"attrs": {
"a_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"b_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"c_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"is_bias_add": {
"type": "int",
"value": [
"0"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "GroupNorm_19",
"type": "SDGroupNorm",
"in_args": [
"/encoder/mid_block/attentions.0/Add_output_0_NHWC.out_4_1_9"
],
"const_args": [
"GroupNorm_19_wts_6_0_18"
],
"out_args": [
"GroupNorm_19.out12_19.out6_0_18"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"wts_shape": {
"type": "int",
"value": [
"1024"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"512"
]
},
"beta_shape": {
"type": "int",
"value": [
"512"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_24-/encoder/mid_block/resnets.1/conv1/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_19.out12_19.out6_0_18"
],
"const_args": [
"NhwcConv_24_weight_NHWC"
],
"out_args": [
"NhwcConv_24_out-/encoder/mid_block/resnets.1/conv1/Conv_output_0.out2_3_24"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"3",
"3",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "GroupNorm_20",
"type": "SDGroupNorm",
"in_args": [
"NhwcConv_24_out-/encoder/mid_block/resnets.1/conv1/Conv_output_0.out2_3_24"
],
"const_args": [
"GroupNorm_20_wts_6_0_19"
],
"out_args": [
"GroupNorm_20.out12_20.out6_0_19"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"wts_shape": {
"type": "int",
"value": [
"1024"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"512"
]
},
"beta_shape": {
"type": "int",
"value": [
"512"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_25-/encoder/mid_block/resnets.1/conv2/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_20.out12_20.out6_0_19"
],
"const_args": [
"NhwcConv_25_weight_NHWC"
],
"out_args": [
"NhwcConv_25_out-/encoder/mid_block/resnets.1/conv2/Conv_output_0.out2_3_25"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"weight_shape": {
"type": "int",
"value": [
"512",
"3",
"3",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "/encoder/mid_block/resnets.1/Add",
"type": "SDAdd",
"in_args": [
"/encoder/mid_block/attentions.0/Add_output_0_NHWC.out_4_1_9",
"NhwcConv_25_out-/encoder/mid_block/resnets.1/conv2/Conv_output_0.out2_3_25"
],
"const_args": [],
"out_args": [
"/encoder/mid_block/resnets.1/Add_output_0_NHWC.out_4_1_10"
],
"attrs": {
"a_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"b_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"c_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"is_bias_add": {
"type": "int",
"value": [
"0"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "GroupNorm_21",
"type": "SDGroupNorm",
"in_args": [
"/encoder/mid_block/resnets.1/Add_output_0_NHWC.out_4_1_10"
],
"const_args": [
"GroupNorm_21_wts_6_0_20"
],
"out_args": [
"GroupNorm_21.out12_21.out6_0_20"
],
"attrs": {
"epsilon": {
"type": "float",
"value": [
"9.999999974752427e-07"
]
},
"groups": {
"type": "int",
"value": [
"32"
]
},
"channels_last": {
"type": "int",
"value": [
"1"
]
},
"activation": {
"type": "int",
"value": [
"0"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"wts_shape": {
"type": "int",
"value": [
"1024"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfloat16"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"gamma_shape": {
"type": "int",
"value": [
"512"
]
},
"beta_shape": {
"type": "int",
"value": [
"512"
]
},
"nonlinear": {
"type": "str",
"value": [
"Silu"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
}
}
},
{
"name": "NhwcConv_26-/encoder/conv_out/Conv",
"type": "SDConv",
"in_args": [
"GroupNorm_21.out12_21.out6_0_20"
],
"const_args": [
"NhwcConv_26_weight_NHWC"
],
"out_args": [
"NhwcConv_26_out-/encoder/conv_out/Conv_output_0.out2_3_26"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"3",
"3"
]
},
"pads": {
"type": "int",
"value": [
"1",
"1",
"1",
"1"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"512"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"8"
]
},
"weight_shape": {
"type": "int",
"value": [
"8",
"3",
"3",
"512"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
},
{
"name": "NhwcConv_27-/quant_conv/Conv",
"type": "SDConv",
"in_args": [
"NhwcConv_26_out-/encoder/conv_out/Conv_output_0.out2_3_26"
],
"const_args": [
"NhwcConv_27_weight_NHWC"
],
"out_args": [
"NhwcConv_27_out-/quant_conv/Conv_output_0.out2_3_27"
],
"attrs": {
"auto_pad": {
"type": "str",
"value": [
"NOTSET"
]
},
"dilations": {
"type": "int",
"value": [
"1",
"1"
]
},
"group": {
"type": "int",
"value": [
"1"
]
},
"kernel_shape": {
"type": "int",
"value": [
"1",
"1"
]
},
"pads": {
"type": "int",
"value": [
"0",
"0",
"0",
"0"
]
},
"strides": {
"type": "int",
"value": [
"1",
"1"
]
},
"input_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"8"
]
},
"output_shape": {
"type": "int",
"value": [
"1",
"128",
"128",
"8"
]
},
"weight_shape": {
"type": "int",
"value": [
"8",
"1",
"1",
"8"
]
},
"out_dtypes": {
"type": "str",
"value": [
"bfloat16"
]
},
"ctrl_packet": {
"type": "int",
"value": [
"1"
]
},
"in_dtypes": {
"type": "str",
"value": [
"bfloat16",
"bfp16ebs8",
"float"
]
}
}
}
],
"fused_tensors": {
"in": {
"buffer_size": 8388608,
"xrt_arg_id": 0,
"packed_tensors": [
"Transpose_0_out-init_image.out2_3_0"
]
},
"out": {
"buffer_size": 262144,
"xrt_arg_id": 1,
"packed_tensors": [
"NhwcConv_27_out-/quant_conv/Conv_output_0.out2_3_27"
]
},
"scratch": {
"buffer_size": 5654183936,
"xrt_arg_id": 2,
"packed_tensors": [
"NhwcConv_0_out-/encoder/conv_in/Conv_output_0.out2_3_0",
"GroupNorm_0.out12_0.out6_0_0",
"NhwcConv_1_out-/encoder/down_blocks.0/resnets.0/conv1/Conv_output_0.out2_3_1",
"GroupNorm_1.out12_1.out6_0_1",
"NhwcConv_2_out-/encoder/down_blocks.0/resnets.0/conv2/Conv_output_0.out2_3_2",
"/encoder/down_blocks.0/resnets.0/Add.out_4_1_0",
"GroupNorm_2.out12_2.out6_0_2",
"NhwcConv_3_out-/encoder/down_blocks.0/resnets.1/conv1/Conv_output_0.out2_3_3",
"GroupNorm_3.out12_3.out6_0_3",
"NhwcConv_4_out-/encoder/down_blocks.0/resnets.1/conv2/Conv_output_0.out2_3_4",
"/encoder/down_blocks.0/resnets.1/Add.out_4_1_1",
"NhwcConv_5_out-/encoder/down_blocks.0/downsamplers.0/conv/Conv_output_0.out2_3_5",
"GroupNorm_4.out12_4.out6_0_4",
"NhwcConv_6_out-/encoder/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out2_3_6",
"NhwcConv_7_out-/encoder/down_blocks.1/resnets.0/conv1/Conv_output_0.out2_3_7",
"GroupNorm_5.out12_5.out6_0_5",
"NhwcConv_8_out-/encoder/down_blocks.1/resnets.0/conv2/Conv_output_0.out2_3_8",
"/encoder/down_blocks.1/resnets.0/Add.out_4_1_2",
"GroupNorm_6.out12_6.out6_0_6",
"NhwcConv_9_out-/encoder/down_blocks.1/resnets.1/conv1/Conv_output_0.out2_3_9",
"GroupNorm_7.out12_7.out6_0_7",
"NhwcConv_10_out-/encoder/down_blocks.1/resnets.1/conv2/Conv_output_0.out2_3_10",
"/encoder/down_blocks.1/resnets.1/Add.out_4_1_3",
"NhwcConv_11_out-/encoder/down_blocks.1/downsamplers.0/conv/Conv_output_0.out2_3_11",
"GroupNorm_8.out12_8.out6_0_8",
"NhwcConv_12_out-/encoder/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out2_3_12",
"NhwcConv_13_out-/encoder/down_blocks.2/resnets.0/conv1/Conv_output_0.out2_3_13",
"GroupNorm_9.out12_9.out6_0_9",
"NhwcConv_14_out-/encoder/down_blocks.2/resnets.0/conv2/Conv_output_0.out2_3_14",
"/encoder/down_blocks.2/resnets.0/Add.out_4_1_4",
"GroupNorm_10.out12_10.out6_0_10",
"NhwcConv_15_out-/encoder/down_blocks.2/resnets.1/conv1/Conv_output_0.out2_3_15",
"GroupNorm_11.out12_11.out6_0_11",
"NhwcConv_16_out-/encoder/down_blocks.2/resnets.1/conv2/Conv_output_0.out2_3_16",
"/encoder/down_blocks.2/resnets.1/Add.out_4_1_5",
"NhwcConv_17_out-/encoder/down_blocks.2/downsamplers.0/conv/Conv_output_0.out2_3_17",
"GroupNorm_12.out12_12.out6_0_12",
"NhwcConv_18_out-/encoder/down_blocks.3/resnets.0/conv1/Conv_output_0.out2_3_18",
"GroupNorm_13.out12_13.out6_0_13",
"NhwcConv_19_out-/encoder/down_blocks.3/resnets.0/conv2/Conv_output_0.out2_3_19",
"/encoder/down_blocks.3/resnets.0/Add.out_4_1_6",
"GroupNorm_14.out12_14.out6_0_14",
"NhwcConv_20_out-/encoder/down_blocks.3/resnets.1/conv1/Conv_output_0.out2_3_20",
"GroupNorm_15.out12_15.out6_0_15",
"NhwcConv_21_out-/encoder/down_blocks.3/resnets.1/conv2/Conv_output_0.out2_3_21",
"/encoder/down_blocks.3/resnets.1/Add.out_4_1_7",
"GroupNorm_16.out12_16.out6_0_16",
"NhwcConv_22_out-/encoder/mid_block/resnets.0/conv1/Conv_output_0.out2_3_22",
"GroupNorm_17.out12_17.out6_0_17",
"NhwcConv_23_out-/encoder/mid_block/resnets.0/conv2/Conv_output_0.out2_3_23",
"/encoder/mid_block/resnets.0/Add.out_4_1_8",
"/encoder/mid_block/attentions.0/group_norm/Add_output_0_4d_NHWC.out6_1_0",
"/encoder/mid_block/attentions.0/Reshape_2_output_0_3d.out3_3_0",
"/encoder/mid_block/attentions.0/Reshape_1_output_0_3d.out3_3_1",
"/encoder/mid_block/attentions.0/Reshape_3_output_0_3d.out3_3_2",
"/encoder/mid_block/attentions.0/Transpose_5_output_0_3d.out12_0",
"/encoder/mid_block/attentions.0/Reshape_5_output_0.nhwc6_0.out3_0_0",
"/encoder/mid_block/attentions.0/Add_output_0_NHWC.out_4_1_9",
"GroupNorm_19.out12_19.out6_0_18",
"NhwcConv_24_out-/encoder/mid_block/resnets.1/conv1/Conv_output_0.out2_3_24",
"GroupNorm_20.out12_20.out6_0_19",
"NhwcConv_25_out-/encoder/mid_block/resnets.1/conv2/Conv_output_0.out2_3_25",
"/encoder/mid_block/resnets.1/Add_output_0_NHWC.out_4_1_10",
"GroupNorm_21.out12_21.out6_0_20",
"NhwcConv_26_out-/encoder/conv_out/Conv_output_0.out2_3_26"
]
},
"const": {
"buffer_size": 42147856,
"xrt_arg_id": 3,
"packed_tensors": [
"NhwcConv_0_weight_NHWC",
"GroupNorm_0_wts_6_0_0",
"NhwcConv_1_weight_NHWC",
"GroupNorm_1_wts_6_0_1",
"NhwcConv_2_weight_NHWC",
"GroupNorm_2_wts_6_0_2",
"NhwcConv_3_weight_NHWC",
"GroupNorm_3_wts_6_0_3",
"NhwcConv_4_weight_NHWC",
"NhwcConv_5_weight_NHWC",
"GroupNorm_4_wts_6_0_4",
"NhwcConv_6_weight_NHWC",
"NhwcConv_7_weight_NHWC",
"GroupNorm_5_wts_6_0_5",
"NhwcConv_8_weight_NHWC",
"GroupNorm_6_wts_6_0_6",
"NhwcConv_9_weight_NHWC",
"GroupNorm_7_wts_6_0_7",
"NhwcConv_10_weight_NHWC",
"NhwcConv_11_weight_NHWC",
"GroupNorm_8_wts_6_0_8",
"NhwcConv_12_weight_NHWC",
"NhwcConv_13_weight_NHWC",
"GroupNorm_9_wts_6_0_9",
"NhwcConv_14_weight_NHWC",
"GroupNorm_10_wts_6_0_10",
"NhwcConv_15_weight_NHWC",
"GroupNorm_11_wts_6_0_11",
"NhwcConv_16_weight_NHWC",
"NhwcConv_17_weight_NHWC",
"GroupNorm_12_wts_6_0_12",
"NhwcConv_18_weight_NHWC",
"GroupNorm_13_wts_6_0_13",
"NhwcConv_19_weight_NHWC",
"GroupNorm_14_wts_6_0_14",
"NhwcConv_20_weight_NHWC",
"GroupNorm_15_wts_6_0_15",
"NhwcConv_21_weight_NHWC",
"GroupNorm_16_wts_6_0_16",
"NhwcConv_22_weight_NHWC",
"GroupNorm_17_wts_6_0_17",
"NhwcConv_23_weight_NHWC",
"GroupNorm_18_wts_6_1_0",
"onnx::MatMul_890_2_0_0",
"onnx::MatMul_889_2_0_1",
"onnx::MatMul_891_2_0_2",
"/encoder/mid_block/attentions.0/MatMul/MatMulScaleFusion/_FusedActivationmha_3_1_0_mask.12_0",
"onnx::MatMul_899_2_0_3",
"GroupNorm_19_wts_6_0_18",
"NhwcConv_24_weight_NHWC",
"GroupNorm_20_wts_6_0_19",
"NhwcConv_25_weight_NHWC",
"GroupNorm_21_wts_6_0_20",
"NhwcConv_26_weight_NHWC",
"NhwcConv_27_weight_NHWC"
]
},
"super_instr": {
"buffer_size": 0,
"xrt_arg_id": 4,
"packed_tensors": []
}
},
"tensor_map": {
"Transpose_0_out-init_image.out2_3_0": {
"packed_buffer_label": "in",
"xrt_arg_id": 0,
"dtype": "bfloat16",
"shape": [
1,
1024,
1024,
4
],
"size_in_bytes": 8388608,
"op_tensor_size": 8388608,
"offset": 0
},
"NhwcConv_27_out-/quant_conv/Conv_output_0.out2_3_27": {
"packed_buffer_label": "out",
"xrt_arg_id": 1,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
8
],
"size_in_bytes": 262144,
"op_tensor_size": 262144,
"offset": 0
},
"NhwcConv_0_out-/encoder/conv_in/Conv_output_0.out2_3_0": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
1024,
1024,
128
],
"size_in_bytes": 268435456,
"op_tensor_size": 268435456,
"offset": 0
},
"GroupNorm_0.out12_0.out6_0_0": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
1024,
1024,
128
],
"size_in_bytes": 268435456,
"op_tensor_size": 268435456,
"offset": 268435456
},
"NhwcConv_1_out-/encoder/down_blocks.0/resnets.0/conv1/Conv_output_0.out2_3_1": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
1024,
1024,
128
],
"size_in_bytes": 268435456,
"op_tensor_size": 268435456,
"offset": 536870912
},
"GroupNorm_1.out12_1.out6_0_1": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
1024,
1024,
128
],
"size_in_bytes": 268435456,
"op_tensor_size": 268435456,
"offset": 805306368
},
"NhwcConv_2_out-/encoder/down_blocks.0/resnets.0/conv2/Conv_output_0.out2_3_2": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
1024,
1024,
128
],
"size_in_bytes": 268435456,
"op_tensor_size": 268435456,
"offset": 1073741824
},
"/encoder/down_blocks.0/resnets.0/Add.out_4_1_0": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
1024,
1024,
128
],
"size_in_bytes": 268435456,
"op_tensor_size": 268435456,
"offset": 1342177280
},
"GroupNorm_2.out12_2.out6_0_2": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
1024,
1024,
128
],
"size_in_bytes": 268435456,
"op_tensor_size": 268435456,
"offset": 1610612736
},
"NhwcConv_3_out-/encoder/down_blocks.0/resnets.1/conv1/Conv_output_0.out2_3_3": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
1024,
1024,
128
],
"size_in_bytes": 268435456,
"op_tensor_size": 268435456,
"offset": 1879048192
},
"GroupNorm_3.out12_3.out6_0_3": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
1024,
1024,
128
],
"size_in_bytes": 268435456,
"op_tensor_size": 268435456,
"offset": 2147483648
},
"NhwcConv_4_out-/encoder/down_blocks.0/resnets.1/conv2/Conv_output_0.out2_3_4": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
1024,
1024,
128
],
"size_in_bytes": 268435456,
"op_tensor_size": 268435456,
"offset": 2415919104
},
"/encoder/down_blocks.0/resnets.1/Add.out_4_1_1": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
1024,
1024,
128
],
"size_in_bytes": 268435456,
"op_tensor_size": 268435456,
"offset": 2684354560
},
"NhwcConv_5_out-/encoder/down_blocks.0/downsamplers.0/conv/Conv_output_0.out2_3_5": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
512,
512,
128
],
"size_in_bytes": 67108864,
"op_tensor_size": 67108864,
"offset": 2952790016
},
"GroupNorm_4.out12_4.out6_0_4": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
512,
512,
128
],
"size_in_bytes": 67108864,
"op_tensor_size": 67108864,
"offset": 3019898880
},
"NhwcConv_6_out-/encoder/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out2_3_6": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
512,
512,
256
],
"size_in_bytes": 134217728,
"op_tensor_size": 134217728,
"offset": 3087007744
},
"NhwcConv_7_out-/encoder/down_blocks.1/resnets.0/conv1/Conv_output_0.out2_3_7": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
512,
512,
256
],
"size_in_bytes": 134217728,
"op_tensor_size": 134217728,
"offset": 3221225472
},
"GroupNorm_5.out12_5.out6_0_5": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
512,
512,
256
],
"size_in_bytes": 134217728,
"op_tensor_size": 134217728,
"offset": 3355443200
},
"NhwcConv_8_out-/encoder/down_blocks.1/resnets.0/conv2/Conv_output_0.out2_3_8": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
512,
512,
256
],
"size_in_bytes": 134217728,
"op_tensor_size": 134217728,
"offset": 3489660928
},
"/encoder/down_blocks.1/resnets.0/Add.out_4_1_2": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
512,
512,
256
],
"size_in_bytes": 134217728,
"op_tensor_size": 134217728,
"offset": 3623878656
},
"GroupNorm_6.out12_6.out6_0_6": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
512,
512,
256
],
"size_in_bytes": 134217728,
"op_tensor_size": 134217728,
"offset": 3758096384
},
"NhwcConv_9_out-/encoder/down_blocks.1/resnets.1/conv1/Conv_output_0.out2_3_9": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
512,
512,
256
],
"size_in_bytes": 134217728,
"op_tensor_size": 134217728,
"offset": 3892314112
},
"GroupNorm_7.out12_7.out6_0_7": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
512,
512,
256
],
"size_in_bytes": 134217728,
"op_tensor_size": 134217728,
"offset": 4026531840
},
"NhwcConv_10_out-/encoder/down_blocks.1/resnets.1/conv2/Conv_output_0.out2_3_10": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
512,
512,
256
],
"size_in_bytes": 134217728,
"op_tensor_size": 134217728,
"offset": 4160749568
},
"/encoder/down_blocks.1/resnets.1/Add.out_4_1_3": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
512,
512,
256
],
"size_in_bytes": 134217728,
"op_tensor_size": 134217728,
"offset": 4294967296
},
"NhwcConv_11_out-/encoder/down_blocks.1/downsamplers.0/conv/Conv_output_0.out2_3_11": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
256,
256,
256
],
"size_in_bytes": 33554432,
"op_tensor_size": 33554432,
"offset": 4429185024
},
"GroupNorm_8.out12_8.out6_0_8": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
256,
256,
256
],
"size_in_bytes": 33554432,
"op_tensor_size": 33554432,
"offset": 4462739456
},
"NhwcConv_12_out-/encoder/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out2_3_12": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
256,
256,
512
],
"size_in_bytes": 67108864,
"op_tensor_size": 67108864,
"offset": 4496293888
},
"NhwcConv_13_out-/encoder/down_blocks.2/resnets.0/conv1/Conv_output_0.out2_3_13": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
256,
256,
512
],
"size_in_bytes": 67108864,
"op_tensor_size": 67108864,
"offset": 4563402752
},
"GroupNorm_9.out12_9.out6_0_9": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
256,
256,
512
],
"size_in_bytes": 67108864,
"op_tensor_size": 67108864,
"offset": 4630511616
},
"NhwcConv_14_out-/encoder/down_blocks.2/resnets.0/conv2/Conv_output_0.out2_3_14": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
256,
256,
512
],
"size_in_bytes": 67108864,
"op_tensor_size": 67108864,
"offset": 4697620480
},
"/encoder/down_blocks.2/resnets.0/Add.out_4_1_4": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
256,
256,
512
],
"size_in_bytes": 67108864,
"op_tensor_size": 67108864,
"offset": 4764729344
},
"GroupNorm_10.out12_10.out6_0_10": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
256,
256,
512
],
"size_in_bytes": 67108864,
"op_tensor_size": 67108864,
"offset": 4831838208
},
"NhwcConv_15_out-/encoder/down_blocks.2/resnets.1/conv1/Conv_output_0.out2_3_15": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
256,
256,
512
],
"size_in_bytes": 67108864,
"op_tensor_size": 67108864,
"offset": 4898947072
},
"GroupNorm_11.out12_11.out6_0_11": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
256,
256,
512
],
"size_in_bytes": 67108864,
"op_tensor_size": 67108864,
"offset": 4966055936
},
"NhwcConv_16_out-/encoder/down_blocks.2/resnets.1/conv2/Conv_output_0.out2_3_16": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
256,
256,
512
],
"size_in_bytes": 67108864,
"op_tensor_size": 67108864,
"offset": 5033164800
},
"/encoder/down_blocks.2/resnets.1/Add.out_4_1_5": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
256,
256,
512
],
"size_in_bytes": 67108864,
"op_tensor_size": 67108864,
"offset": 5100273664
},
"NhwcConv_17_out-/encoder/down_blocks.2/downsamplers.0/conv/Conv_output_0.out2_3_17": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5167382528
},
"GroupNorm_12.out12_12.out6_0_12": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5184159744
},
"NhwcConv_18_out-/encoder/down_blocks.3/resnets.0/conv1/Conv_output_0.out2_3_18": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5200936960
},
"GroupNorm_13.out12_13.out6_0_13": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5217714176
},
"NhwcConv_19_out-/encoder/down_blocks.3/resnets.0/conv2/Conv_output_0.out2_3_19": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5234491392
},
"/encoder/down_blocks.3/resnets.0/Add.out_4_1_6": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5251268608
},
"GroupNorm_14.out12_14.out6_0_14": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5268045824
},
"NhwcConv_20_out-/encoder/down_blocks.3/resnets.1/conv1/Conv_output_0.out2_3_20": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5284823040
},
"GroupNorm_15.out12_15.out6_0_15": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5301600256
},
"NhwcConv_21_out-/encoder/down_blocks.3/resnets.1/conv2/Conv_output_0.out2_3_21": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5318377472
},
"/encoder/down_blocks.3/resnets.1/Add.out_4_1_7": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5335154688
},
"GroupNorm_16.out12_16.out6_0_16": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5351931904
},
"NhwcConv_22_out-/encoder/mid_block/resnets.0/conv1/Conv_output_0.out2_3_22": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5368709120
},
"GroupNorm_17.out12_17.out6_0_17": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5385486336
},
"NhwcConv_23_out-/encoder/mid_block/resnets.0/conv2/Conv_output_0.out2_3_23": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5402263552
},
"/encoder/mid_block/resnets.0/Add.out_4_1_8": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5419040768
},
"/encoder/mid_block/attentions.0/group_norm/Add_output_0_4d_NHWC.out6_1_0": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
16384,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5435817984
},
"/encoder/mid_block/attentions.0/Reshape_2_output_0_3d.out3_3_0": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
16384,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5452595200
},
"/encoder/mid_block/attentions.0/Reshape_1_output_0_3d.out3_3_1": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
16384,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5469372416
},
"/encoder/mid_block/attentions.0/Reshape_3_output_0_3d.out3_3_2": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
16384,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5486149632
},
"/encoder/mid_block/attentions.0/Transpose_5_output_0_3d.out12_0": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
16384,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5502926848
},
"/encoder/mid_block/attentions.0/Reshape_5_output_0.nhwc6_0.out3_0_0": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5519704064
},
"/encoder/mid_block/attentions.0/Add_output_0_NHWC.out_4_1_9": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5536481280
},
"GroupNorm_19.out12_19.out6_0_18": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5553258496
},
"NhwcConv_24_out-/encoder/mid_block/resnets.1/conv1/Conv_output_0.out2_3_24": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5570035712
},
"GroupNorm_20.out12_20.out6_0_19": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5586812928
},
"NhwcConv_25_out-/encoder/mid_block/resnets.1/conv2/Conv_output_0.out2_3_25": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5603590144
},
"/encoder/mid_block/resnets.1/Add_output_0_NHWC.out_4_1_10": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5620367360
},
"GroupNorm_21.out12_21.out6_0_20": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
512
],
"size_in_bytes": 16777216,
"op_tensor_size": 16777216,
"offset": 5637144576
},
"NhwcConv_26_out-/encoder/conv_out/Conv_output_0.out2_3_26": {
"packed_buffer_label": "scratch",
"xrt_arg_id": 2,
"dtype": "bfloat16",
"shape": [
1,
128,
128,
8
],
"size_in_bytes": 262144,
"op_tensor_size": 262144,
"offset": 5653921792
},
"NhwcConv_0_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
12416
],
"size_in_bytes": 12416,
"op_tensor_size": 12416,
"offset": 0,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_0.const",
"file_size": 12416
},
"GroupNorm_0_wts_6_0_0": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
256
],
"size_in_bytes": 512,
"op_tensor_size": 512,
"offset": 12416,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_1.const",
"file_size": 512
},
"NhwcConv_1_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
174080
],
"size_in_bytes": 174080,
"op_tensor_size": 174080,
"offset": 12928,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_2.const",
"file_size": 174080
},
"GroupNorm_1_wts_6_0_1": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
256
],
"size_in_bytes": 512,
"op_tensor_size": 512,
"offset": 187008,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_3.const",
"file_size": 512
},
"NhwcConv_2_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
174080
],
"size_in_bytes": 174080,
"op_tensor_size": 174080,
"offset": 187520,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_4.const",
"file_size": 174080
},
"GroupNorm_2_wts_6_0_2": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
256
],
"size_in_bytes": 512,
"op_tensor_size": 512,
"offset": 361600,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_5.const",
"file_size": 512
},
"NhwcConv_3_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
174080
],
"size_in_bytes": 174080,
"op_tensor_size": 174080,
"offset": 362112,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_6.const",
"file_size": 174080
},
"GroupNorm_3_wts_6_0_3": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
256
],
"size_in_bytes": 512,
"op_tensor_size": 512,
"offset": 536192,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_7.const",
"file_size": 512
},
"NhwcConv_4_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
174080
],
"size_in_bytes": 174080,
"op_tensor_size": 174080,
"offset": 536704,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_8.const",
"file_size": 174080
},
"NhwcConv_5_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
174080
],
"size_in_bytes": 174080,
"op_tensor_size": 174080,
"offset": 710784,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_9.const",
"file_size": 174080
},
"GroupNorm_4_wts_6_0_4": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
256
],
"size_in_bytes": 512,
"op_tensor_size": 512,
"offset": 884864,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_10.const",
"file_size": 512
},
"NhwcConv_6_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
40960
],
"size_in_bytes": 40960,
"op_tensor_size": 40960,
"offset": 885376,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_11.const",
"file_size": 40960
},
"NhwcConv_7_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
348160
],
"size_in_bytes": 348160,
"op_tensor_size": 348160,
"offset": 926336,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_12.const",
"file_size": 348160
},
"GroupNorm_5_wts_6_0_5": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
512
],
"size_in_bytes": 1024,
"op_tensor_size": 1024,
"offset": 1274496,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_13.const",
"file_size": 1024
},
"NhwcConv_8_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
729088
],
"size_in_bytes": 729088,
"op_tensor_size": 729088,
"offset": 1275520,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_14.const",
"file_size": 729088
},
"GroupNorm_6_wts_6_0_6": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
512
],
"size_in_bytes": 1024,
"op_tensor_size": 1024,
"offset": 2004608,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_15.const",
"file_size": 1024
},
"NhwcConv_9_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
729088
],
"size_in_bytes": 729088,
"op_tensor_size": 729088,
"offset": 2005632,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_16.const",
"file_size": 729088
},
"GroupNorm_7_wts_6_0_7": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
512
],
"size_in_bytes": 1024,
"op_tensor_size": 1024,
"offset": 2734720,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_17.const",
"file_size": 1024
},
"NhwcConv_10_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
729088
],
"size_in_bytes": 729088,
"op_tensor_size": 729088,
"offset": 2735744,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_18.const",
"file_size": 729088
},
"NhwcConv_11_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
729088
],
"size_in_bytes": 729088,
"op_tensor_size": 729088,
"offset": 3464832,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_19.const",
"file_size": 729088
},
"GroupNorm_8_wts_6_0_8": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
512
],
"size_in_bytes": 1024,
"op_tensor_size": 1024,
"offset": 4193920,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_20.const",
"file_size": 1024
},
"NhwcConv_12_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
155648
],
"size_in_bytes": 155648,
"op_tensor_size": 155648,
"offset": 4194944,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_21.const",
"file_size": 155648
},
"NhwcConv_13_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
1458176
],
"size_in_bytes": 1458176,
"op_tensor_size": 1458176,
"offset": 4350592,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_22.const",
"file_size": 1458176
},
"GroupNorm_9_wts_6_0_9": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
1024
],
"size_in_bytes": 2048,
"op_tensor_size": 2048,
"offset": 5808768,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_23.const",
"file_size": 2048
},
"NhwcConv_14_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
2916352
],
"size_in_bytes": 2916352,
"op_tensor_size": 2916352,
"offset": 5810816,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_24.const",
"file_size": 2916352
},
"GroupNorm_10_wts_6_0_10": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
1024
],
"size_in_bytes": 2048,
"op_tensor_size": 2048,
"offset": 8727168,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_25.const",
"file_size": 2048
},
"NhwcConv_15_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
2916352
],
"size_in_bytes": 2916352,
"op_tensor_size": 2916352,
"offset": 8729216,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_26.const",
"file_size": 2916352
},
"GroupNorm_11_wts_6_0_11": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
1024
],
"size_in_bytes": 2048,
"op_tensor_size": 2048,
"offset": 11645568,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_27.const",
"file_size": 2048
},
"NhwcConv_16_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
2916352
],
"size_in_bytes": 2916352,
"op_tensor_size": 2916352,
"offset": 11647616,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_28.const",
"file_size": 2916352
},
"NhwcConv_17_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
2916352
],
"size_in_bytes": 2916352,
"op_tensor_size": 2916352,
"offset": 14563968,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_29.const",
"file_size": 2916352
},
"GroupNorm_12_wts_6_0_12": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
1024
],
"size_in_bytes": 2048,
"op_tensor_size": 2048,
"offset": 17480320,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_30.const",
"file_size": 2048
},
"NhwcConv_18_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
2916352
],
"size_in_bytes": 2916352,
"op_tensor_size": 2916352,
"offset": 17482368,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_31.const",
"file_size": 2916352
},
"GroupNorm_13_wts_6_0_13": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
1024
],
"size_in_bytes": 2048,
"op_tensor_size": 2048,
"offset": 20398720,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_32.const",
"file_size": 2048
},
"NhwcConv_19_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
2916352
],
"size_in_bytes": 2916352,
"op_tensor_size": 2916352,
"offset": 20400768,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_33.const",
"file_size": 2916352
},
"GroupNorm_14_wts_6_0_14": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
1024
],
"size_in_bytes": 2048,
"op_tensor_size": 2048,
"offset": 23317120,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_34.const",
"file_size": 2048
},
"NhwcConv_20_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
2916352
],
"size_in_bytes": 2916352,
"op_tensor_size": 2916352,
"offset": 23319168,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_35.const",
"file_size": 2916352
},
"GroupNorm_15_wts_6_0_15": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
1024
],
"size_in_bytes": 2048,
"op_tensor_size": 2048,
"offset": 26235520,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_36.const",
"file_size": 2048
},
"NhwcConv_21_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
2916352
],
"size_in_bytes": 2916352,
"op_tensor_size": 2916352,
"offset": 26237568,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_37.const",
"file_size": 2916352
},
"GroupNorm_16_wts_6_0_16": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
1024
],
"size_in_bytes": 2048,
"op_tensor_size": 2048,
"offset": 29153920,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_38.const",
"file_size": 2048
},
"NhwcConv_22_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
2916352
],
"size_in_bytes": 2916352,
"op_tensor_size": 2916352,
"offset": 29155968,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_39.const",
"file_size": 2916352
},
"GroupNorm_17_wts_6_0_17": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
1024
],
"size_in_bytes": 2048,
"op_tensor_size": 2048,
"offset": 32072320,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_40.const",
"file_size": 2048
},
"NhwcConv_23_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
2916352
],
"size_in_bytes": 2916352,
"op_tensor_size": 2916352,
"offset": 32074368,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_41.const",
"file_size": 2916352
},
"GroupNorm_18_wts_6_1_0": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
1024
],
"size_in_bytes": 2048,
"op_tensor_size": 2048,
"offset": 34990720,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_42.const",
"file_size": 2048
},
"onnx::MatMul_890_2_0_0": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
299008
],
"size_in_bytes": 299008,
"op_tensor_size": 299008,
"offset": 34992768,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_43.const",
"file_size": 299008
},
"onnx::MatMul_889_2_0_1": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
299008
],
"size_in_bytes": 299008,
"op_tensor_size": 299008,
"offset": 35291776,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_44.const",
"file_size": 299008
},
"onnx::MatMul_891_2_0_2": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
299008
],
"size_in_bytes": 299008,
"op_tensor_size": 299008,
"offset": 35590784,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_45.const",
"file_size": 299008
},
"/encoder/mid_block/attentions.0/MatMul/MatMulScaleFusion/_FusedActivationmha_3_1_0_mask.12_0": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
16384
],
"size_in_bytes": 32768,
"op_tensor_size": 32768,
"offset": 35889792,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_46.const",
"file_size": 32768
},
"onnx::MatMul_899_2_0_3": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
299008
],
"size_in_bytes": 299008,
"op_tensor_size": 299008,
"offset": 35922560,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_47.const",
"file_size": 299008
},
"GroupNorm_19_wts_6_0_18": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
1024
],
"size_in_bytes": 2048,
"op_tensor_size": 2048,
"offset": 36221568,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_48.const",
"file_size": 2048
},
"NhwcConv_24_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
2916352
],
"size_in_bytes": 2916352,
"op_tensor_size": 2916352,
"offset": 36223616,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_49.const",
"file_size": 2916352
},
"GroupNorm_20_wts_6_0_19": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
1024
],
"size_in_bytes": 2048,
"op_tensor_size": 2048,
"offset": 39139968,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_50.const",
"file_size": 2048
},
"NhwcConv_25_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
2916352
],
"size_in_bytes": 2916352,
"op_tensor_size": 2916352,
"offset": 39142016,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_51.const",
"file_size": 2916352
},
"GroupNorm_21_wts_6_0_20": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfloat16",
"shape": [
1024
],
"size_in_bytes": 2048,
"op_tensor_size": 2048,
"offset": 42058368,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_52.const",
"file_size": 2048
},
"NhwcConv_26_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
87040
],
"size_in_bytes": 87040,
"op_tensor_size": 87040,
"offset": 42060416,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_53.const",
"file_size": 87040
},
"NhwcConv_27_weight_NHWC": {
"packed_buffer_label": "const",
"xrt_arg_id": 3,
"dtype": "bfp16ebs8",
"shape": [
400
],
"size_in_bytes": 400,
"op_tensor_size": 400,
"offset": 42147456,
"file_name": "cache/NhwcConv_0-encoderconv_inConv_54.const",
"file_size": 400
}
},
"aux_info": {}
}