program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3500.14.1"}, {"coremlc-version", "3500.32.1"}, {"coremltools-component-torch", "2.2.2"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "8.3.0"}})] { func main(tensor logmel_data) { tensor var_32_pad_type_0 = const()[name = tensor("op_32_pad_type_0"), val = tensor("custom")]; tensor var_32_pad_0 = const()[name = tensor("op_32_pad_0"), val = tensor([1, 1])]; tensor var_32_strides_0 = const()[name = tensor("op_32_strides_0"), val = tensor([1])]; tensor var_32_dilations_0 = const()[name = tensor("op_32_dilations_0"), val = tensor([1])]; tensor var_32_groups_0 = const()[name = tensor("op_32_groups_0"), val = tensor(1)]; tensor logmel_data_to_fp16_dtype_0 = const()[name = tensor("logmel_data_to_fp16_dtype_0"), val = tensor("fp16")]; tensor const_0_to_fp16 = const()[name = tensor("const_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor const_1_to_fp16 = const()[name = tensor("const_1_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245888)))]; tensor logmel_data_to_fp16 = cast(dtype = logmel_data_to_fp16_dtype_0, x = logmel_data)[name = tensor("cast_28")]; tensor var_32_cast_fp16 = conv(bias = const_1_to_fp16, dilations = var_32_dilations_0, groups = var_32_groups_0, pad = var_32_pad_0, pad_type = var_32_pad_type_0, strides = var_32_strides_0, weight = const_0_to_fp16, x = logmel_data_to_fp16)[name = tensor("op_32_cast_fp16")]; tensor input_1_mode_0 = const()[name = tensor("input_1_mode_0"), val = tensor("EXACT")]; tensor input_1_cast_fp16 = gelu(mode = input_1_mode_0, x = var_32_cast_fp16)[name = tensor("input_1_cast_fp16")]; tensor var_50_pad_type_0 = const()[name = tensor("op_50_pad_type_0"), val = tensor("custom")]; tensor var_50_pad_0 = const()[name = tensor("op_50_pad_0"), val = tensor([1, 1])]; tensor var_50_strides_0 = const()[name = tensor("op_50_strides_0"), val = tensor([2])]; tensor var_50_dilations_0 = const()[name = tensor("op_50_dilations_0"), val = tensor([1])]; tensor var_50_groups_0 = const()[name = tensor("op_50_groups_0"), val = tensor(1)]; tensor const_2_to_fp16 = const()[name = tensor("const_2_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246976)))]; tensor const_3_to_fp16 = const()[name = tensor("const_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1819904)))]; tensor var_50_cast_fp16 = conv(bias = const_3_to_fp16, dilations = var_50_dilations_0, groups = var_50_groups_0, pad = var_50_pad_0, pad_type = var_50_pad_type_0, strides = var_50_strides_0, weight = const_2_to_fp16, x = input_1_cast_fp16)[name = tensor("op_50_cast_fp16")]; tensor x_3_mode_0 = const()[name = tensor("x_3_mode_0"), val = tensor("EXACT")]; tensor x_3_cast_fp16 = gelu(mode = x_3_mode_0, x = var_50_cast_fp16)[name = tensor("x_3_cast_fp16")]; tensor var_55_to_fp16 = const()[name = tensor("op_55_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1820992)))]; tensor var_57_cast_fp16 = add(x = x_3_cast_fp16, y = var_55_to_fp16)[name = tensor("op_57_cast_fp16")]; tensor inputs_1_axes_0 = const()[name = tensor("inputs_1_axes_0"), val = tensor([2])]; tensor inputs_1_cast_fp16 = expand_dims(axes = inputs_1_axes_0, x = var_57_cast_fp16)[name = tensor("inputs_1_cast_fp16")]; tensor var_72 = const()[name = tensor("op_72"), val = tensor(1)]; tensor input_3_axes_0 = const()[name = tensor("input_3_axes_0"), val = tensor([1])]; tensor input_3_gamma_0_to_fp16 = const()[name = tensor("input_3_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3357056)))]; tensor input_3_beta_0_to_fp16 = const()[name = tensor("input_3_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3358144)))]; tensor var_88_to_fp16 = const()[name = tensor("op_88_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_3_cast_fp16 = layer_norm(axes = input_3_axes_0, beta = input_3_beta_0_to_fp16, epsilon = var_88_to_fp16, gamma = input_3_gamma_0_to_fp16, x = inputs_1_cast_fp16)[name = tensor("input_3_cast_fp16")]; tensor q_1_pad_type_0 = const()[name = tensor("q_1_pad_type_0"), val = tensor("valid")]; tensor q_1_strides_0 = const()[name = tensor("q_1_strides_0"), val = tensor([1, 1])]; tensor q_1_pad_0 = const()[name = tensor("q_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_1_dilations_0 = const()[name = tensor("q_1_dilations_0"), val = tensor([1, 1])]; tensor q_1_groups_0 = const()[name = tensor("q_1_groups_0"), val = tensor(1)]; tensor var_123_weight_0_to_fp16 = const()[name = tensor("op_123_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3359232)))]; tensor var_123_bias_0_to_fp16 = const()[name = tensor("op_123_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3883584)))]; tensor var_123_cast_fp16 = conv(bias = var_123_bias_0_to_fp16, dilations = q_1_dilations_0, groups = q_1_groups_0, pad = q_1_pad_0, pad_type = q_1_pad_type_0, strides = q_1_strides_0, weight = var_123_weight_0_to_fp16, x = input_3_cast_fp16)[name = tensor("op_123_cast_fp16")]; tensor k_1_pad_type_0 = const()[name = tensor("k_1_pad_type_0"), val = tensor("valid")]; tensor k_1_strides_0 = const()[name = tensor("k_1_strides_0"), val = tensor([1, 1])]; tensor k_1_pad_0 = const()[name = tensor("k_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_1_dilations_0 = const()[name = tensor("k_1_dilations_0"), val = tensor([1, 1])]; tensor k_1_groups_0 = const()[name = tensor("k_1_groups_0"), val = tensor(1)]; tensor blocks_0_attn_key_weight_to_fp16 = const()[name = tensor("blocks_0_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3884672)))]; tensor k_1_cast_fp16 = conv(dilations = k_1_dilations_0, groups = k_1_groups_0, pad = k_1_pad_0, pad_type = k_1_pad_type_0, strides = k_1_strides_0, weight = blocks_0_attn_key_weight_to_fp16, x = input_3_cast_fp16)[name = tensor("k_1_cast_fp16")]; tensor var_121_pad_type_0 = const()[name = tensor("op_121_pad_type_0"), val = tensor("valid")]; tensor var_121_strides_0 = const()[name = tensor("op_121_strides_0"), val = tensor([1, 1])]; tensor var_121_pad_0 = const()[name = tensor("op_121_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_121_dilations_0 = const()[name = tensor("op_121_dilations_0"), val = tensor([1, 1])]; tensor var_121_groups_0 = const()[name = tensor("op_121_groups_0"), val = tensor(1)]; tensor blocks_0_attn_value_weight_to_fp16 = const()[name = tensor("blocks_0_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4409024)))]; tensor blocks_0_attn_value_bias_to_fp16 = const()[name = tensor("blocks_0_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4933376)))]; tensor var_121_cast_fp16 = conv(bias = blocks_0_attn_value_bias_to_fp16, dilations = var_121_dilations_0, groups = var_121_groups_0, pad = var_121_pad_0, pad_type = var_121_pad_type_0, strides = var_121_strides_0, weight = blocks_0_attn_value_weight_to_fp16, x = input_3_cast_fp16)[name = tensor("op_121_cast_fp16")]; tensor tile_0 = const()[name = tensor("tile_0"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_124_axis_0 = const()[name = tensor("op_124_axis_0"), val = tensor(1)]; tensor var_124_cast_fp16_0, tensor var_124_cast_fp16_1, tensor var_124_cast_fp16_2, tensor var_124_cast_fp16_3, tensor var_124_cast_fp16_4, tensor var_124_cast_fp16_5, tensor var_124_cast_fp16_6, tensor var_124_cast_fp16_7 = split(axis = var_124_axis_0, split_sizes = tile_0, x = var_123_cast_fp16)[name = tensor("op_124_cast_fp16")]; tensor var_133_perm_0 = const()[name = tensor("op_133_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_1 = const()[name = tensor("tile_1"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_134_axis_0 = const()[name = tensor("op_134_axis_0"), val = tensor(3)]; tensor var_133_cast_fp16 = transpose(perm = var_133_perm_0, x = k_1_cast_fp16)[name = tensor("transpose_6")]; tensor var_134_cast_fp16_0, tensor var_134_cast_fp16_1, tensor var_134_cast_fp16_2, tensor var_134_cast_fp16_3, tensor var_134_cast_fp16_4, tensor var_134_cast_fp16_5, tensor var_134_cast_fp16_6, tensor var_134_cast_fp16_7 = split(axis = var_134_axis_0, split_sizes = tile_1, x = var_133_cast_fp16)[name = tensor("op_134_cast_fp16")]; tensor tile_2 = const()[name = tensor("tile_2"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_143_axis_0 = const()[name = tensor("op_143_axis_0"), val = tensor(1)]; tensor var_143_cast_fp16_0, tensor var_143_cast_fp16_1, tensor var_143_cast_fp16_2, tensor var_143_cast_fp16_3, tensor var_143_cast_fp16_4, tensor var_143_cast_fp16_5, tensor var_143_cast_fp16_6, tensor var_143_cast_fp16_7 = split(axis = var_143_axis_0, split_sizes = tile_2, x = var_121_cast_fp16)[name = tensor("op_143_cast_fp16")]; tensor aw_1_equation_0 = const()[name = tensor("aw_1_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1_cast_fp16 = einsum(equation = aw_1_equation_0, values = (var_134_cast_fp16_0, var_124_cast_fp16_0))[name = tensor("aw_1_cast_fp16")]; tensor aw_3_equation_0 = const()[name = tensor("aw_3_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_3_cast_fp16 = einsum(equation = aw_3_equation_0, values = (var_134_cast_fp16_1, var_124_cast_fp16_1))[name = tensor("aw_3_cast_fp16")]; tensor aw_5_equation_0 = const()[name = tensor("aw_5_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_5_cast_fp16 = einsum(equation = aw_5_equation_0, values = (var_134_cast_fp16_2, var_124_cast_fp16_2))[name = tensor("aw_5_cast_fp16")]; tensor aw_7_equation_0 = const()[name = tensor("aw_7_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_7_cast_fp16 = einsum(equation = aw_7_equation_0, values = (var_134_cast_fp16_3, var_124_cast_fp16_3))[name = tensor("aw_7_cast_fp16")]; tensor aw_9_equation_0 = const()[name = tensor("aw_9_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_9_cast_fp16 = einsum(equation = aw_9_equation_0, values = (var_134_cast_fp16_4, var_124_cast_fp16_4))[name = tensor("aw_9_cast_fp16")]; tensor aw_11_equation_0 = const()[name = tensor("aw_11_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_11_cast_fp16 = einsum(equation = aw_11_equation_0, values = (var_134_cast_fp16_5, var_124_cast_fp16_5))[name = tensor("aw_11_cast_fp16")]; tensor aw_13_equation_0 = const()[name = tensor("aw_13_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_13_cast_fp16 = einsum(equation = aw_13_equation_0, values = (var_134_cast_fp16_6, var_124_cast_fp16_6))[name = tensor("aw_13_cast_fp16")]; tensor aw_15_equation_0 = const()[name = tensor("aw_15_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_15_cast_fp16 = einsum(equation = aw_15_equation_0, values = (var_134_cast_fp16_7, var_124_cast_fp16_7))[name = tensor("aw_15_cast_fp16")]; tensor var_168_cast_fp16 = softmax(axis = var_72, x = aw_1_cast_fp16)[name = tensor("op_168_cast_fp16")]; tensor var_169_cast_fp16 = softmax(axis = var_72, x = aw_3_cast_fp16)[name = tensor("op_169_cast_fp16")]; tensor var_170_cast_fp16 = softmax(axis = var_72, x = aw_5_cast_fp16)[name = tensor("op_170_cast_fp16")]; tensor var_171_cast_fp16 = softmax(axis = var_72, x = aw_7_cast_fp16)[name = tensor("op_171_cast_fp16")]; tensor var_172_cast_fp16 = softmax(axis = var_72, x = aw_9_cast_fp16)[name = tensor("op_172_cast_fp16")]; tensor var_173_cast_fp16 = softmax(axis = var_72, x = aw_11_cast_fp16)[name = tensor("op_173_cast_fp16")]; tensor var_174_cast_fp16 = softmax(axis = var_72, x = aw_13_cast_fp16)[name = tensor("op_174_cast_fp16")]; tensor var_175_cast_fp16 = softmax(axis = var_72, x = aw_15_cast_fp16)[name = tensor("op_175_cast_fp16")]; tensor var_177_equation_0 = const()[name = tensor("op_177_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_177_cast_fp16 = einsum(equation = var_177_equation_0, values = (var_143_cast_fp16_0, var_168_cast_fp16))[name = tensor("op_177_cast_fp16")]; tensor var_179_equation_0 = const()[name = tensor("op_179_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_179_cast_fp16 = einsum(equation = var_179_equation_0, values = (var_143_cast_fp16_1, var_169_cast_fp16))[name = tensor("op_179_cast_fp16")]; tensor var_181_equation_0 = const()[name = tensor("op_181_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_181_cast_fp16 = einsum(equation = var_181_equation_0, values = (var_143_cast_fp16_2, var_170_cast_fp16))[name = tensor("op_181_cast_fp16")]; tensor var_183_equation_0 = const()[name = tensor("op_183_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_183_cast_fp16 = einsum(equation = var_183_equation_0, values = (var_143_cast_fp16_3, var_171_cast_fp16))[name = tensor("op_183_cast_fp16")]; tensor var_185_equation_0 = const()[name = tensor("op_185_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_185_cast_fp16 = einsum(equation = var_185_equation_0, values = (var_143_cast_fp16_4, var_172_cast_fp16))[name = tensor("op_185_cast_fp16")]; tensor var_187_equation_0 = const()[name = tensor("op_187_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_187_cast_fp16 = einsum(equation = var_187_equation_0, values = (var_143_cast_fp16_5, var_173_cast_fp16))[name = tensor("op_187_cast_fp16")]; tensor var_189_equation_0 = const()[name = tensor("op_189_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_189_cast_fp16 = einsum(equation = var_189_equation_0, values = (var_143_cast_fp16_6, var_174_cast_fp16))[name = tensor("op_189_cast_fp16")]; tensor var_191_equation_0 = const()[name = tensor("op_191_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_191_cast_fp16 = einsum(equation = var_191_equation_0, values = (var_143_cast_fp16_7, var_175_cast_fp16))[name = tensor("op_191_cast_fp16")]; tensor input_5_interleave_0 = const()[name = tensor("input_5_interleave_0"), val = tensor(false)]; tensor input_5_cast_fp16 = concat(axis = var_72, interleave = input_5_interleave_0, values = (var_177_cast_fp16, var_179_cast_fp16, var_181_cast_fp16, var_183_cast_fp16, var_185_cast_fp16, var_187_cast_fp16, var_189_cast_fp16, var_191_cast_fp16))[name = tensor("input_5_cast_fp16")]; tensor var_200_pad_type_0 = const()[name = tensor("op_200_pad_type_0"), val = tensor("valid")]; tensor var_200_strides_0 = const()[name = tensor("op_200_strides_0"), val = tensor([1, 1])]; tensor var_200_pad_0 = const()[name = tensor("op_200_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_200_dilations_0 = const()[name = tensor("op_200_dilations_0"), val = tensor([1, 1])]; tensor var_200_groups_0 = const()[name = tensor("op_200_groups_0"), val = tensor(1)]; tensor blocks_0_attn_out_weight_to_fp16 = const()[name = tensor("blocks_0_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4934464)))]; tensor blocks_0_attn_out_bias_to_fp16 = const()[name = tensor("blocks_0_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5458816)))]; tensor var_200_cast_fp16 = conv(bias = blocks_0_attn_out_bias_to_fp16, dilations = var_200_dilations_0, groups = var_200_groups_0, pad = var_200_pad_0, pad_type = var_200_pad_type_0, strides = var_200_strides_0, weight = blocks_0_attn_out_weight_to_fp16, x = input_5_cast_fp16)[name = tensor("op_200_cast_fp16")]; tensor inputs_3_cast_fp16 = add(x = inputs_1_cast_fp16, y = var_200_cast_fp16)[name = tensor("inputs_3_cast_fp16")]; tensor input_7_axes_0 = const()[name = tensor("input_7_axes_0"), val = tensor([1])]; tensor input_7_gamma_0_to_fp16 = const()[name = tensor("input_7_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5459904)))]; tensor input_7_beta_0_to_fp16 = const()[name = tensor("input_7_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5460992)))]; tensor var_210_to_fp16 = const()[name = tensor("op_210_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_7_cast_fp16 = layer_norm(axes = input_7_axes_0, beta = input_7_beta_0_to_fp16, epsilon = var_210_to_fp16, gamma = input_7_gamma_0_to_fp16, x = inputs_3_cast_fp16)[name = tensor("input_7_cast_fp16")]; tensor input_9_pad_type_0 = const()[name = tensor("input_9_pad_type_0"), val = tensor("valid")]; tensor input_9_strides_0 = const()[name = tensor("input_9_strides_0"), val = tensor([1, 1])]; tensor input_9_pad_0 = const()[name = tensor("input_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_9_dilations_0 = const()[name = tensor("input_9_dilations_0"), val = tensor([1, 1])]; tensor input_9_groups_0 = const()[name = tensor("input_9_groups_0"), val = tensor(1)]; tensor blocks_0_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_0_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5462080)))]; tensor blocks_0_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_0_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7559296)))]; tensor input_9_cast_fp16 = conv(bias = blocks_0_mlp_0_bias_to_fp16, dilations = input_9_dilations_0, groups = input_9_groups_0, pad = input_9_pad_0, pad_type = input_9_pad_type_0, strides = input_9_strides_0, weight = blocks_0_mlp_0_weight_to_fp16, x = input_7_cast_fp16)[name = tensor("input_9_cast_fp16")]; tensor input_11_mode_0 = const()[name = tensor("input_11_mode_0"), val = tensor("EXACT")]; tensor input_11_cast_fp16 = gelu(mode = input_11_mode_0, x = input_9_cast_fp16)[name = tensor("input_11_cast_fp16")]; tensor var_236_pad_type_0 = const()[name = tensor("op_236_pad_type_0"), val = tensor("valid")]; tensor var_236_strides_0 = const()[name = tensor("op_236_strides_0"), val = tensor([1, 1])]; tensor var_236_pad_0 = const()[name = tensor("op_236_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_236_dilations_0 = const()[name = tensor("op_236_dilations_0"), val = tensor([1, 1])]; tensor var_236_groups_0 = const()[name = tensor("op_236_groups_0"), val = tensor(1)]; tensor blocks_0_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_0_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7563456)))]; tensor blocks_0_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_0_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9660672)))]; tensor var_236_cast_fp16 = conv(bias = blocks_0_mlp_2_bias_to_fp16, dilations = var_236_dilations_0, groups = var_236_groups_0, pad = var_236_pad_0, pad_type = var_236_pad_type_0, strides = var_236_strides_0, weight = blocks_0_mlp_2_weight_to_fp16, x = input_11_cast_fp16)[name = tensor("op_236_cast_fp16")]; tensor inputs_5_cast_fp16 = add(x = inputs_3_cast_fp16, y = var_236_cast_fp16)[name = tensor("inputs_5_cast_fp16")]; tensor var_245 = const()[name = tensor("op_245"), val = tensor(1)]; tensor input_13_axes_0 = const()[name = tensor("input_13_axes_0"), val = tensor([1])]; tensor input_13_gamma_0_to_fp16 = const()[name = tensor("input_13_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9661760)))]; tensor input_13_beta_0_to_fp16 = const()[name = tensor("input_13_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9662848)))]; tensor var_261_to_fp16 = const()[name = tensor("op_261_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_13_cast_fp16 = layer_norm(axes = input_13_axes_0, beta = input_13_beta_0_to_fp16, epsilon = var_261_to_fp16, gamma = input_13_gamma_0_to_fp16, x = inputs_5_cast_fp16)[name = tensor("input_13_cast_fp16")]; tensor q_3_pad_type_0 = const()[name = tensor("q_3_pad_type_0"), val = tensor("valid")]; tensor q_3_strides_0 = const()[name = tensor("q_3_strides_0"), val = tensor([1, 1])]; tensor q_3_pad_0 = const()[name = tensor("q_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_3_dilations_0 = const()[name = tensor("q_3_dilations_0"), val = tensor([1, 1])]; tensor q_3_groups_0 = const()[name = tensor("q_3_groups_0"), val = tensor(1)]; tensor var_296_weight_0_to_fp16 = const()[name = tensor("op_296_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9663936)))]; tensor var_296_bias_0_to_fp16 = const()[name = tensor("op_296_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10188288)))]; tensor var_296_cast_fp16 = conv(bias = var_296_bias_0_to_fp16, dilations = q_3_dilations_0, groups = q_3_groups_0, pad = q_3_pad_0, pad_type = q_3_pad_type_0, strides = q_3_strides_0, weight = var_296_weight_0_to_fp16, x = input_13_cast_fp16)[name = tensor("op_296_cast_fp16")]; tensor k_3_pad_type_0 = const()[name = tensor("k_3_pad_type_0"), val = tensor("valid")]; tensor k_3_strides_0 = const()[name = tensor("k_3_strides_0"), val = tensor([1, 1])]; tensor k_3_pad_0 = const()[name = tensor("k_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_3_dilations_0 = const()[name = tensor("k_3_dilations_0"), val = tensor([1, 1])]; tensor k_3_groups_0 = const()[name = tensor("k_3_groups_0"), val = tensor(1)]; tensor blocks_1_attn_key_weight_to_fp16 = const()[name = tensor("blocks_1_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10189376)))]; tensor k_3_cast_fp16 = conv(dilations = k_3_dilations_0, groups = k_3_groups_0, pad = k_3_pad_0, pad_type = k_3_pad_type_0, strides = k_3_strides_0, weight = blocks_1_attn_key_weight_to_fp16, x = input_13_cast_fp16)[name = tensor("k_3_cast_fp16")]; tensor var_294_pad_type_0 = const()[name = tensor("op_294_pad_type_0"), val = tensor("valid")]; tensor var_294_strides_0 = const()[name = tensor("op_294_strides_0"), val = tensor([1, 1])]; tensor var_294_pad_0 = const()[name = tensor("op_294_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_294_dilations_0 = const()[name = tensor("op_294_dilations_0"), val = tensor([1, 1])]; tensor var_294_groups_0 = const()[name = tensor("op_294_groups_0"), val = tensor(1)]; tensor blocks_1_attn_value_weight_to_fp16 = const()[name = tensor("blocks_1_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10713728)))]; tensor blocks_1_attn_value_bias_to_fp16 = const()[name = tensor("blocks_1_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11238080)))]; tensor var_294_cast_fp16 = conv(bias = blocks_1_attn_value_bias_to_fp16, dilations = var_294_dilations_0, groups = var_294_groups_0, pad = var_294_pad_0, pad_type = var_294_pad_type_0, strides = var_294_strides_0, weight = blocks_1_attn_value_weight_to_fp16, x = input_13_cast_fp16)[name = tensor("op_294_cast_fp16")]; tensor tile_3 = const()[name = tensor("tile_3"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_297_axis_0 = const()[name = tensor("op_297_axis_0"), val = tensor(1)]; tensor var_297_cast_fp16_0, tensor var_297_cast_fp16_1, tensor var_297_cast_fp16_2, tensor var_297_cast_fp16_3, tensor var_297_cast_fp16_4, tensor var_297_cast_fp16_5, tensor var_297_cast_fp16_6, tensor var_297_cast_fp16_7 = split(axis = var_297_axis_0, split_sizes = tile_3, x = var_296_cast_fp16)[name = tensor("op_297_cast_fp16")]; tensor var_306_perm_0 = const()[name = tensor("op_306_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_4 = const()[name = tensor("tile_4"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_307_axis_0 = const()[name = tensor("op_307_axis_0"), val = tensor(3)]; tensor var_306_cast_fp16 = transpose(perm = var_306_perm_0, x = k_3_cast_fp16)[name = tensor("transpose_5")]; tensor var_307_cast_fp16_0, tensor var_307_cast_fp16_1, tensor var_307_cast_fp16_2, tensor var_307_cast_fp16_3, tensor var_307_cast_fp16_4, tensor var_307_cast_fp16_5, tensor var_307_cast_fp16_6, tensor var_307_cast_fp16_7 = split(axis = var_307_axis_0, split_sizes = tile_4, x = var_306_cast_fp16)[name = tensor("op_307_cast_fp16")]; tensor tile_5 = const()[name = tensor("tile_5"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_316_axis_0 = const()[name = tensor("op_316_axis_0"), val = tensor(1)]; tensor var_316_cast_fp16_0, tensor var_316_cast_fp16_1, tensor var_316_cast_fp16_2, tensor var_316_cast_fp16_3, tensor var_316_cast_fp16_4, tensor var_316_cast_fp16_5, tensor var_316_cast_fp16_6, tensor var_316_cast_fp16_7 = split(axis = var_316_axis_0, split_sizes = tile_5, x = var_294_cast_fp16)[name = tensor("op_316_cast_fp16")]; tensor aw_17_equation_0 = const()[name = tensor("aw_17_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_17_cast_fp16 = einsum(equation = aw_17_equation_0, values = (var_307_cast_fp16_0, var_297_cast_fp16_0))[name = tensor("aw_17_cast_fp16")]; tensor aw_19_equation_0 = const()[name = tensor("aw_19_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_19_cast_fp16 = einsum(equation = aw_19_equation_0, values = (var_307_cast_fp16_1, var_297_cast_fp16_1))[name = tensor("aw_19_cast_fp16")]; tensor aw_21_equation_0 = const()[name = tensor("aw_21_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_21_cast_fp16 = einsum(equation = aw_21_equation_0, values = (var_307_cast_fp16_2, var_297_cast_fp16_2))[name = tensor("aw_21_cast_fp16")]; tensor aw_23_equation_0 = const()[name = tensor("aw_23_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_23_cast_fp16 = einsum(equation = aw_23_equation_0, values = (var_307_cast_fp16_3, var_297_cast_fp16_3))[name = tensor("aw_23_cast_fp16")]; tensor aw_25_equation_0 = const()[name = tensor("aw_25_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_25_cast_fp16 = einsum(equation = aw_25_equation_0, values = (var_307_cast_fp16_4, var_297_cast_fp16_4))[name = tensor("aw_25_cast_fp16")]; tensor aw_27_equation_0 = const()[name = tensor("aw_27_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_27_cast_fp16 = einsum(equation = aw_27_equation_0, values = (var_307_cast_fp16_5, var_297_cast_fp16_5))[name = tensor("aw_27_cast_fp16")]; tensor aw_29_equation_0 = const()[name = tensor("aw_29_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_29_cast_fp16 = einsum(equation = aw_29_equation_0, values = (var_307_cast_fp16_6, var_297_cast_fp16_6))[name = tensor("aw_29_cast_fp16")]; tensor aw_31_equation_0 = const()[name = tensor("aw_31_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_31_cast_fp16 = einsum(equation = aw_31_equation_0, values = (var_307_cast_fp16_7, var_297_cast_fp16_7))[name = tensor("aw_31_cast_fp16")]; tensor var_341_cast_fp16 = softmax(axis = var_245, x = aw_17_cast_fp16)[name = tensor("op_341_cast_fp16")]; tensor var_342_cast_fp16 = softmax(axis = var_245, x = aw_19_cast_fp16)[name = tensor("op_342_cast_fp16")]; tensor var_343_cast_fp16 = softmax(axis = var_245, x = aw_21_cast_fp16)[name = tensor("op_343_cast_fp16")]; tensor var_344_cast_fp16 = softmax(axis = var_245, x = aw_23_cast_fp16)[name = tensor("op_344_cast_fp16")]; tensor var_345_cast_fp16 = softmax(axis = var_245, x = aw_25_cast_fp16)[name = tensor("op_345_cast_fp16")]; tensor var_346_cast_fp16 = softmax(axis = var_245, x = aw_27_cast_fp16)[name = tensor("op_346_cast_fp16")]; tensor var_347_cast_fp16 = softmax(axis = var_245, x = aw_29_cast_fp16)[name = tensor("op_347_cast_fp16")]; tensor var_348_cast_fp16 = softmax(axis = var_245, x = aw_31_cast_fp16)[name = tensor("op_348_cast_fp16")]; tensor var_350_equation_0 = const()[name = tensor("op_350_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_350_cast_fp16 = einsum(equation = var_350_equation_0, values = (var_316_cast_fp16_0, var_341_cast_fp16))[name = tensor("op_350_cast_fp16")]; tensor var_352_equation_0 = const()[name = tensor("op_352_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_352_cast_fp16 = einsum(equation = var_352_equation_0, values = (var_316_cast_fp16_1, var_342_cast_fp16))[name = tensor("op_352_cast_fp16")]; tensor var_354_equation_0 = const()[name = tensor("op_354_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_354_cast_fp16 = einsum(equation = var_354_equation_0, values = (var_316_cast_fp16_2, var_343_cast_fp16))[name = tensor("op_354_cast_fp16")]; tensor var_356_equation_0 = const()[name = tensor("op_356_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_356_cast_fp16 = einsum(equation = var_356_equation_0, values = (var_316_cast_fp16_3, var_344_cast_fp16))[name = tensor("op_356_cast_fp16")]; tensor var_358_equation_0 = const()[name = tensor("op_358_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_358_cast_fp16 = einsum(equation = var_358_equation_0, values = (var_316_cast_fp16_4, var_345_cast_fp16))[name = tensor("op_358_cast_fp16")]; tensor var_360_equation_0 = const()[name = tensor("op_360_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_360_cast_fp16 = einsum(equation = var_360_equation_0, values = (var_316_cast_fp16_5, var_346_cast_fp16))[name = tensor("op_360_cast_fp16")]; tensor var_362_equation_0 = const()[name = tensor("op_362_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_362_cast_fp16 = einsum(equation = var_362_equation_0, values = (var_316_cast_fp16_6, var_347_cast_fp16))[name = tensor("op_362_cast_fp16")]; tensor var_364_equation_0 = const()[name = tensor("op_364_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_364_cast_fp16 = einsum(equation = var_364_equation_0, values = (var_316_cast_fp16_7, var_348_cast_fp16))[name = tensor("op_364_cast_fp16")]; tensor input_15_interleave_0 = const()[name = tensor("input_15_interleave_0"), val = tensor(false)]; tensor input_15_cast_fp16 = concat(axis = var_245, interleave = input_15_interleave_0, values = (var_350_cast_fp16, var_352_cast_fp16, var_354_cast_fp16, var_356_cast_fp16, var_358_cast_fp16, var_360_cast_fp16, var_362_cast_fp16, var_364_cast_fp16))[name = tensor("input_15_cast_fp16")]; tensor var_373_pad_type_0 = const()[name = tensor("op_373_pad_type_0"), val = tensor("valid")]; tensor var_373_strides_0 = const()[name = tensor("op_373_strides_0"), val = tensor([1, 1])]; tensor var_373_pad_0 = const()[name = tensor("op_373_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_373_dilations_0 = const()[name = tensor("op_373_dilations_0"), val = tensor([1, 1])]; tensor var_373_groups_0 = const()[name = tensor("op_373_groups_0"), val = tensor(1)]; tensor blocks_1_attn_out_weight_to_fp16 = const()[name = tensor("blocks_1_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11239168)))]; tensor blocks_1_attn_out_bias_to_fp16 = const()[name = tensor("blocks_1_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11763520)))]; tensor var_373_cast_fp16 = conv(bias = blocks_1_attn_out_bias_to_fp16, dilations = var_373_dilations_0, groups = var_373_groups_0, pad = var_373_pad_0, pad_type = var_373_pad_type_0, strides = var_373_strides_0, weight = blocks_1_attn_out_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("op_373_cast_fp16")]; tensor inputs_7_cast_fp16 = add(x = inputs_5_cast_fp16, y = var_373_cast_fp16)[name = tensor("inputs_7_cast_fp16")]; tensor input_17_axes_0 = const()[name = tensor("input_17_axes_0"), val = tensor([1])]; tensor input_17_gamma_0_to_fp16 = const()[name = tensor("input_17_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11764608)))]; tensor input_17_beta_0_to_fp16 = const()[name = tensor("input_17_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11765696)))]; tensor var_383_to_fp16 = const()[name = tensor("op_383_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_17_cast_fp16 = layer_norm(axes = input_17_axes_0, beta = input_17_beta_0_to_fp16, epsilon = var_383_to_fp16, gamma = input_17_gamma_0_to_fp16, x = inputs_7_cast_fp16)[name = tensor("input_17_cast_fp16")]; tensor input_19_pad_type_0 = const()[name = tensor("input_19_pad_type_0"), val = tensor("valid")]; tensor input_19_strides_0 = const()[name = tensor("input_19_strides_0"), val = tensor([1, 1])]; tensor input_19_pad_0 = const()[name = tensor("input_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_19_dilations_0 = const()[name = tensor("input_19_dilations_0"), val = tensor([1, 1])]; tensor input_19_groups_0 = const()[name = tensor("input_19_groups_0"), val = tensor(1)]; tensor blocks_1_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_1_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11766784)))]; tensor blocks_1_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_1_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13864000)))]; tensor input_19_cast_fp16 = conv(bias = blocks_1_mlp_0_bias_to_fp16, dilations = input_19_dilations_0, groups = input_19_groups_0, pad = input_19_pad_0, pad_type = input_19_pad_type_0, strides = input_19_strides_0, weight = blocks_1_mlp_0_weight_to_fp16, x = input_17_cast_fp16)[name = tensor("input_19_cast_fp16")]; tensor input_21_mode_0 = const()[name = tensor("input_21_mode_0"), val = tensor("EXACT")]; tensor input_21_cast_fp16 = gelu(mode = input_21_mode_0, x = input_19_cast_fp16)[name = tensor("input_21_cast_fp16")]; tensor var_409_pad_type_0 = const()[name = tensor("op_409_pad_type_0"), val = tensor("valid")]; tensor var_409_strides_0 = const()[name = tensor("op_409_strides_0"), val = tensor([1, 1])]; tensor var_409_pad_0 = const()[name = tensor("op_409_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_409_dilations_0 = const()[name = tensor("op_409_dilations_0"), val = tensor([1, 1])]; tensor var_409_groups_0 = const()[name = tensor("op_409_groups_0"), val = tensor(1)]; tensor blocks_1_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_1_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13868160)))]; tensor blocks_1_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_1_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15965376)))]; tensor var_409_cast_fp16 = conv(bias = blocks_1_mlp_2_bias_to_fp16, dilations = var_409_dilations_0, groups = var_409_groups_0, pad = var_409_pad_0, pad_type = var_409_pad_type_0, strides = var_409_strides_0, weight = blocks_1_mlp_2_weight_to_fp16, x = input_21_cast_fp16)[name = tensor("op_409_cast_fp16")]; tensor inputs_9_cast_fp16 = add(x = inputs_7_cast_fp16, y = var_409_cast_fp16)[name = tensor("inputs_9_cast_fp16")]; tensor var_418 = const()[name = tensor("op_418"), val = tensor(1)]; tensor input_23_axes_0 = const()[name = tensor("input_23_axes_0"), val = tensor([1])]; tensor input_23_gamma_0_to_fp16 = const()[name = tensor("input_23_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15966464)))]; tensor input_23_beta_0_to_fp16 = const()[name = tensor("input_23_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15967552)))]; tensor var_434_to_fp16 = const()[name = tensor("op_434_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_23_cast_fp16 = layer_norm(axes = input_23_axes_0, beta = input_23_beta_0_to_fp16, epsilon = var_434_to_fp16, gamma = input_23_gamma_0_to_fp16, x = inputs_9_cast_fp16)[name = tensor("input_23_cast_fp16")]; tensor q_5_pad_type_0 = const()[name = tensor("q_5_pad_type_0"), val = tensor("valid")]; tensor q_5_strides_0 = const()[name = tensor("q_5_strides_0"), val = tensor([1, 1])]; tensor q_5_pad_0 = const()[name = tensor("q_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_5_dilations_0 = const()[name = tensor("q_5_dilations_0"), val = tensor([1, 1])]; tensor q_5_groups_0 = const()[name = tensor("q_5_groups_0"), val = tensor(1)]; tensor var_469_weight_0_to_fp16 = const()[name = tensor("op_469_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15968640)))]; tensor var_469_bias_0_to_fp16 = const()[name = tensor("op_469_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16492992)))]; tensor var_469_cast_fp16 = conv(bias = var_469_bias_0_to_fp16, dilations = q_5_dilations_0, groups = q_5_groups_0, pad = q_5_pad_0, pad_type = q_5_pad_type_0, strides = q_5_strides_0, weight = var_469_weight_0_to_fp16, x = input_23_cast_fp16)[name = tensor("op_469_cast_fp16")]; tensor k_5_pad_type_0 = const()[name = tensor("k_5_pad_type_0"), val = tensor("valid")]; tensor k_5_strides_0 = const()[name = tensor("k_5_strides_0"), val = tensor([1, 1])]; tensor k_5_pad_0 = const()[name = tensor("k_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_5_dilations_0 = const()[name = tensor("k_5_dilations_0"), val = tensor([1, 1])]; tensor k_5_groups_0 = const()[name = tensor("k_5_groups_0"), val = tensor(1)]; tensor blocks_2_attn_key_weight_to_fp16 = const()[name = tensor("blocks_2_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16494080)))]; tensor k_5_cast_fp16 = conv(dilations = k_5_dilations_0, groups = k_5_groups_0, pad = k_5_pad_0, pad_type = k_5_pad_type_0, strides = k_5_strides_0, weight = blocks_2_attn_key_weight_to_fp16, x = input_23_cast_fp16)[name = tensor("k_5_cast_fp16")]; tensor var_467_pad_type_0 = const()[name = tensor("op_467_pad_type_0"), val = tensor("valid")]; tensor var_467_strides_0 = const()[name = tensor("op_467_strides_0"), val = tensor([1, 1])]; tensor var_467_pad_0 = const()[name = tensor("op_467_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_467_dilations_0 = const()[name = tensor("op_467_dilations_0"), val = tensor([1, 1])]; tensor var_467_groups_0 = const()[name = tensor("op_467_groups_0"), val = tensor(1)]; tensor blocks_2_attn_value_weight_to_fp16 = const()[name = tensor("blocks_2_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17018432)))]; tensor blocks_2_attn_value_bias_to_fp16 = const()[name = tensor("blocks_2_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17542784)))]; tensor var_467_cast_fp16 = conv(bias = blocks_2_attn_value_bias_to_fp16, dilations = var_467_dilations_0, groups = var_467_groups_0, pad = var_467_pad_0, pad_type = var_467_pad_type_0, strides = var_467_strides_0, weight = blocks_2_attn_value_weight_to_fp16, x = input_23_cast_fp16)[name = tensor("op_467_cast_fp16")]; tensor tile_6 = const()[name = tensor("tile_6"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_470_axis_0 = const()[name = tensor("op_470_axis_0"), val = tensor(1)]; tensor var_470_cast_fp16_0, tensor var_470_cast_fp16_1, tensor var_470_cast_fp16_2, tensor var_470_cast_fp16_3, tensor var_470_cast_fp16_4, tensor var_470_cast_fp16_5, tensor var_470_cast_fp16_6, tensor var_470_cast_fp16_7 = split(axis = var_470_axis_0, split_sizes = tile_6, x = var_469_cast_fp16)[name = tensor("op_470_cast_fp16")]; tensor var_479_perm_0 = const()[name = tensor("op_479_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_7 = const()[name = tensor("tile_7"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_480_axis_0 = const()[name = tensor("op_480_axis_0"), val = tensor(3)]; tensor var_479_cast_fp16 = transpose(perm = var_479_perm_0, x = k_5_cast_fp16)[name = tensor("transpose_4")]; tensor var_480_cast_fp16_0, tensor var_480_cast_fp16_1, tensor var_480_cast_fp16_2, tensor var_480_cast_fp16_3, tensor var_480_cast_fp16_4, tensor var_480_cast_fp16_5, tensor var_480_cast_fp16_6, tensor var_480_cast_fp16_7 = split(axis = var_480_axis_0, split_sizes = tile_7, x = var_479_cast_fp16)[name = tensor("op_480_cast_fp16")]; tensor tile_8 = const()[name = tensor("tile_8"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_489_axis_0 = const()[name = tensor("op_489_axis_0"), val = tensor(1)]; tensor var_489_cast_fp16_0, tensor var_489_cast_fp16_1, tensor var_489_cast_fp16_2, tensor var_489_cast_fp16_3, tensor var_489_cast_fp16_4, tensor var_489_cast_fp16_5, tensor var_489_cast_fp16_6, tensor var_489_cast_fp16_7 = split(axis = var_489_axis_0, split_sizes = tile_8, x = var_467_cast_fp16)[name = tensor("op_489_cast_fp16")]; tensor aw_33_equation_0 = const()[name = tensor("aw_33_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_33_cast_fp16 = einsum(equation = aw_33_equation_0, values = (var_480_cast_fp16_0, var_470_cast_fp16_0))[name = tensor("aw_33_cast_fp16")]; tensor aw_35_equation_0 = const()[name = tensor("aw_35_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_35_cast_fp16 = einsum(equation = aw_35_equation_0, values = (var_480_cast_fp16_1, var_470_cast_fp16_1))[name = tensor("aw_35_cast_fp16")]; tensor aw_37_equation_0 = const()[name = tensor("aw_37_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_37_cast_fp16 = einsum(equation = aw_37_equation_0, values = (var_480_cast_fp16_2, var_470_cast_fp16_2))[name = tensor("aw_37_cast_fp16")]; tensor aw_39_equation_0 = const()[name = tensor("aw_39_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_39_cast_fp16 = einsum(equation = aw_39_equation_0, values = (var_480_cast_fp16_3, var_470_cast_fp16_3))[name = tensor("aw_39_cast_fp16")]; tensor aw_41_equation_0 = const()[name = tensor("aw_41_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_41_cast_fp16 = einsum(equation = aw_41_equation_0, values = (var_480_cast_fp16_4, var_470_cast_fp16_4))[name = tensor("aw_41_cast_fp16")]; tensor aw_43_equation_0 = const()[name = tensor("aw_43_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_43_cast_fp16 = einsum(equation = aw_43_equation_0, values = (var_480_cast_fp16_5, var_470_cast_fp16_5))[name = tensor("aw_43_cast_fp16")]; tensor aw_45_equation_0 = const()[name = tensor("aw_45_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_45_cast_fp16 = einsum(equation = aw_45_equation_0, values = (var_480_cast_fp16_6, var_470_cast_fp16_6))[name = tensor("aw_45_cast_fp16")]; tensor aw_47_equation_0 = const()[name = tensor("aw_47_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_47_cast_fp16 = einsum(equation = aw_47_equation_0, values = (var_480_cast_fp16_7, var_470_cast_fp16_7))[name = tensor("aw_47_cast_fp16")]; tensor var_514_cast_fp16 = softmax(axis = var_418, x = aw_33_cast_fp16)[name = tensor("op_514_cast_fp16")]; tensor var_515_cast_fp16 = softmax(axis = var_418, x = aw_35_cast_fp16)[name = tensor("op_515_cast_fp16")]; tensor var_516_cast_fp16 = softmax(axis = var_418, x = aw_37_cast_fp16)[name = tensor("op_516_cast_fp16")]; tensor var_517_cast_fp16 = softmax(axis = var_418, x = aw_39_cast_fp16)[name = tensor("op_517_cast_fp16")]; tensor var_518_cast_fp16 = softmax(axis = var_418, x = aw_41_cast_fp16)[name = tensor("op_518_cast_fp16")]; tensor var_519_cast_fp16 = softmax(axis = var_418, x = aw_43_cast_fp16)[name = tensor("op_519_cast_fp16")]; tensor var_520_cast_fp16 = softmax(axis = var_418, x = aw_45_cast_fp16)[name = tensor("op_520_cast_fp16")]; tensor var_521_cast_fp16 = softmax(axis = var_418, x = aw_47_cast_fp16)[name = tensor("op_521_cast_fp16")]; tensor var_523_equation_0 = const()[name = tensor("op_523_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_523_cast_fp16 = einsum(equation = var_523_equation_0, values = (var_489_cast_fp16_0, var_514_cast_fp16))[name = tensor("op_523_cast_fp16")]; tensor var_525_equation_0 = const()[name = tensor("op_525_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_525_cast_fp16 = einsum(equation = var_525_equation_0, values = (var_489_cast_fp16_1, var_515_cast_fp16))[name = tensor("op_525_cast_fp16")]; tensor var_527_equation_0 = const()[name = tensor("op_527_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_527_cast_fp16 = einsum(equation = var_527_equation_0, values = (var_489_cast_fp16_2, var_516_cast_fp16))[name = tensor("op_527_cast_fp16")]; tensor var_529_equation_0 = const()[name = tensor("op_529_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_529_cast_fp16 = einsum(equation = var_529_equation_0, values = (var_489_cast_fp16_3, var_517_cast_fp16))[name = tensor("op_529_cast_fp16")]; tensor var_531_equation_0 = const()[name = tensor("op_531_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_531_cast_fp16 = einsum(equation = var_531_equation_0, values = (var_489_cast_fp16_4, var_518_cast_fp16))[name = tensor("op_531_cast_fp16")]; tensor var_533_equation_0 = const()[name = tensor("op_533_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_533_cast_fp16 = einsum(equation = var_533_equation_0, values = (var_489_cast_fp16_5, var_519_cast_fp16))[name = tensor("op_533_cast_fp16")]; tensor var_535_equation_0 = const()[name = tensor("op_535_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_535_cast_fp16 = einsum(equation = var_535_equation_0, values = (var_489_cast_fp16_6, var_520_cast_fp16))[name = tensor("op_535_cast_fp16")]; tensor var_537_equation_0 = const()[name = tensor("op_537_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_537_cast_fp16 = einsum(equation = var_537_equation_0, values = (var_489_cast_fp16_7, var_521_cast_fp16))[name = tensor("op_537_cast_fp16")]; tensor input_25_interleave_0 = const()[name = tensor("input_25_interleave_0"), val = tensor(false)]; tensor input_25_cast_fp16 = concat(axis = var_418, interleave = input_25_interleave_0, values = (var_523_cast_fp16, var_525_cast_fp16, var_527_cast_fp16, var_529_cast_fp16, var_531_cast_fp16, var_533_cast_fp16, var_535_cast_fp16, var_537_cast_fp16))[name = tensor("input_25_cast_fp16")]; tensor var_546_pad_type_0 = const()[name = tensor("op_546_pad_type_0"), val = tensor("valid")]; tensor var_546_strides_0 = const()[name = tensor("op_546_strides_0"), val = tensor([1, 1])]; tensor var_546_pad_0 = const()[name = tensor("op_546_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_546_dilations_0 = const()[name = tensor("op_546_dilations_0"), val = tensor([1, 1])]; tensor var_546_groups_0 = const()[name = tensor("op_546_groups_0"), val = tensor(1)]; tensor blocks_2_attn_out_weight_to_fp16 = const()[name = tensor("blocks_2_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17543872)))]; tensor blocks_2_attn_out_bias_to_fp16 = const()[name = tensor("blocks_2_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18068224)))]; tensor var_546_cast_fp16 = conv(bias = blocks_2_attn_out_bias_to_fp16, dilations = var_546_dilations_0, groups = var_546_groups_0, pad = var_546_pad_0, pad_type = var_546_pad_type_0, strides = var_546_strides_0, weight = blocks_2_attn_out_weight_to_fp16, x = input_25_cast_fp16)[name = tensor("op_546_cast_fp16")]; tensor inputs_11_cast_fp16 = add(x = inputs_9_cast_fp16, y = var_546_cast_fp16)[name = tensor("inputs_11_cast_fp16")]; tensor input_27_axes_0 = const()[name = tensor("input_27_axes_0"), val = tensor([1])]; tensor input_27_gamma_0_to_fp16 = const()[name = tensor("input_27_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18069312)))]; tensor input_27_beta_0_to_fp16 = const()[name = tensor("input_27_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18070400)))]; tensor var_556_to_fp16 = const()[name = tensor("op_556_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_27_cast_fp16 = layer_norm(axes = input_27_axes_0, beta = input_27_beta_0_to_fp16, epsilon = var_556_to_fp16, gamma = input_27_gamma_0_to_fp16, x = inputs_11_cast_fp16)[name = tensor("input_27_cast_fp16")]; tensor input_29_pad_type_0 = const()[name = tensor("input_29_pad_type_0"), val = tensor("valid")]; tensor input_29_strides_0 = const()[name = tensor("input_29_strides_0"), val = tensor([1, 1])]; tensor input_29_pad_0 = const()[name = tensor("input_29_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_29_dilations_0 = const()[name = tensor("input_29_dilations_0"), val = tensor([1, 1])]; tensor input_29_groups_0 = const()[name = tensor("input_29_groups_0"), val = tensor(1)]; tensor blocks_2_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_2_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18071488)))]; tensor blocks_2_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_2_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20168704)))]; tensor input_29_cast_fp16 = conv(bias = blocks_2_mlp_0_bias_to_fp16, dilations = input_29_dilations_0, groups = input_29_groups_0, pad = input_29_pad_0, pad_type = input_29_pad_type_0, strides = input_29_strides_0, weight = blocks_2_mlp_0_weight_to_fp16, x = input_27_cast_fp16)[name = tensor("input_29_cast_fp16")]; tensor input_31_mode_0 = const()[name = tensor("input_31_mode_0"), val = tensor("EXACT")]; tensor input_31_cast_fp16 = gelu(mode = input_31_mode_0, x = input_29_cast_fp16)[name = tensor("input_31_cast_fp16")]; tensor var_582_pad_type_0 = const()[name = tensor("op_582_pad_type_0"), val = tensor("valid")]; tensor var_582_strides_0 = const()[name = tensor("op_582_strides_0"), val = tensor([1, 1])]; tensor var_582_pad_0 = const()[name = tensor("op_582_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_582_dilations_0 = const()[name = tensor("op_582_dilations_0"), val = tensor([1, 1])]; tensor var_582_groups_0 = const()[name = tensor("op_582_groups_0"), val = tensor(1)]; tensor blocks_2_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_2_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20172864)))]; tensor blocks_2_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_2_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22270080)))]; tensor var_582_cast_fp16 = conv(bias = blocks_2_mlp_2_bias_to_fp16, dilations = var_582_dilations_0, groups = var_582_groups_0, pad = var_582_pad_0, pad_type = var_582_pad_type_0, strides = var_582_strides_0, weight = blocks_2_mlp_2_weight_to_fp16, x = input_31_cast_fp16)[name = tensor("op_582_cast_fp16")]; tensor inputs_13_cast_fp16 = add(x = inputs_11_cast_fp16, y = var_582_cast_fp16)[name = tensor("inputs_13_cast_fp16")]; tensor var_591 = const()[name = tensor("op_591"), val = tensor(1)]; tensor input_33_axes_0 = const()[name = tensor("input_33_axes_0"), val = tensor([1])]; tensor input_33_gamma_0_to_fp16 = const()[name = tensor("input_33_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22271168)))]; tensor input_33_beta_0_to_fp16 = const()[name = tensor("input_33_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22272256)))]; tensor var_607_to_fp16 = const()[name = tensor("op_607_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_33_cast_fp16 = layer_norm(axes = input_33_axes_0, beta = input_33_beta_0_to_fp16, epsilon = var_607_to_fp16, gamma = input_33_gamma_0_to_fp16, x = inputs_13_cast_fp16)[name = tensor("input_33_cast_fp16")]; tensor q_7_pad_type_0 = const()[name = tensor("q_7_pad_type_0"), val = tensor("valid")]; tensor q_7_strides_0 = const()[name = tensor("q_7_strides_0"), val = tensor([1, 1])]; tensor q_7_pad_0 = const()[name = tensor("q_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_7_dilations_0 = const()[name = tensor("q_7_dilations_0"), val = tensor([1, 1])]; tensor q_7_groups_0 = const()[name = tensor("q_7_groups_0"), val = tensor(1)]; tensor var_642_weight_0_to_fp16 = const()[name = tensor("op_642_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22273344)))]; tensor var_642_bias_0_to_fp16 = const()[name = tensor("op_642_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22797696)))]; tensor var_642_cast_fp16 = conv(bias = var_642_bias_0_to_fp16, dilations = q_7_dilations_0, groups = q_7_groups_0, pad = q_7_pad_0, pad_type = q_7_pad_type_0, strides = q_7_strides_0, weight = var_642_weight_0_to_fp16, x = input_33_cast_fp16)[name = tensor("op_642_cast_fp16")]; tensor k_7_pad_type_0 = const()[name = tensor("k_7_pad_type_0"), val = tensor("valid")]; tensor k_7_strides_0 = const()[name = tensor("k_7_strides_0"), val = tensor([1, 1])]; tensor k_7_pad_0 = const()[name = tensor("k_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_7_dilations_0 = const()[name = tensor("k_7_dilations_0"), val = tensor([1, 1])]; tensor k_7_groups_0 = const()[name = tensor("k_7_groups_0"), val = tensor(1)]; tensor blocks_3_attn_key_weight_to_fp16 = const()[name = tensor("blocks_3_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22798784)))]; tensor k_7_cast_fp16 = conv(dilations = k_7_dilations_0, groups = k_7_groups_0, pad = k_7_pad_0, pad_type = k_7_pad_type_0, strides = k_7_strides_0, weight = blocks_3_attn_key_weight_to_fp16, x = input_33_cast_fp16)[name = tensor("k_7_cast_fp16")]; tensor var_640_pad_type_0 = const()[name = tensor("op_640_pad_type_0"), val = tensor("valid")]; tensor var_640_strides_0 = const()[name = tensor("op_640_strides_0"), val = tensor([1, 1])]; tensor var_640_pad_0 = const()[name = tensor("op_640_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_640_dilations_0 = const()[name = tensor("op_640_dilations_0"), val = tensor([1, 1])]; tensor var_640_groups_0 = const()[name = tensor("op_640_groups_0"), val = tensor(1)]; tensor blocks_3_attn_value_weight_to_fp16 = const()[name = tensor("blocks_3_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23323136)))]; tensor blocks_3_attn_value_bias_to_fp16 = const()[name = tensor("blocks_3_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23847488)))]; tensor var_640_cast_fp16 = conv(bias = blocks_3_attn_value_bias_to_fp16, dilations = var_640_dilations_0, groups = var_640_groups_0, pad = var_640_pad_0, pad_type = var_640_pad_type_0, strides = var_640_strides_0, weight = blocks_3_attn_value_weight_to_fp16, x = input_33_cast_fp16)[name = tensor("op_640_cast_fp16")]; tensor tile_9 = const()[name = tensor("tile_9"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_643_axis_0 = const()[name = tensor("op_643_axis_0"), val = tensor(1)]; tensor var_643_cast_fp16_0, tensor var_643_cast_fp16_1, tensor var_643_cast_fp16_2, tensor var_643_cast_fp16_3, tensor var_643_cast_fp16_4, tensor var_643_cast_fp16_5, tensor var_643_cast_fp16_6, tensor var_643_cast_fp16_7 = split(axis = var_643_axis_0, split_sizes = tile_9, x = var_642_cast_fp16)[name = tensor("op_643_cast_fp16")]; tensor var_652_perm_0 = const()[name = tensor("op_652_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_10 = const()[name = tensor("tile_10"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_653_axis_0 = const()[name = tensor("op_653_axis_0"), val = tensor(3)]; tensor var_652_cast_fp16 = transpose(perm = var_652_perm_0, x = k_7_cast_fp16)[name = tensor("transpose_3")]; tensor var_653_cast_fp16_0, tensor var_653_cast_fp16_1, tensor var_653_cast_fp16_2, tensor var_653_cast_fp16_3, tensor var_653_cast_fp16_4, tensor var_653_cast_fp16_5, tensor var_653_cast_fp16_6, tensor var_653_cast_fp16_7 = split(axis = var_653_axis_0, split_sizes = tile_10, x = var_652_cast_fp16)[name = tensor("op_653_cast_fp16")]; tensor tile_11 = const()[name = tensor("tile_11"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_662_axis_0 = const()[name = tensor("op_662_axis_0"), val = tensor(1)]; tensor var_662_cast_fp16_0, tensor var_662_cast_fp16_1, tensor var_662_cast_fp16_2, tensor var_662_cast_fp16_3, tensor var_662_cast_fp16_4, tensor var_662_cast_fp16_5, tensor var_662_cast_fp16_6, tensor var_662_cast_fp16_7 = split(axis = var_662_axis_0, split_sizes = tile_11, x = var_640_cast_fp16)[name = tensor("op_662_cast_fp16")]; tensor aw_49_equation_0 = const()[name = tensor("aw_49_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_49_cast_fp16 = einsum(equation = aw_49_equation_0, values = (var_653_cast_fp16_0, var_643_cast_fp16_0))[name = tensor("aw_49_cast_fp16")]; tensor aw_51_equation_0 = const()[name = tensor("aw_51_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_51_cast_fp16 = einsum(equation = aw_51_equation_0, values = (var_653_cast_fp16_1, var_643_cast_fp16_1))[name = tensor("aw_51_cast_fp16")]; tensor aw_53_equation_0 = const()[name = tensor("aw_53_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_53_cast_fp16 = einsum(equation = aw_53_equation_0, values = (var_653_cast_fp16_2, var_643_cast_fp16_2))[name = tensor("aw_53_cast_fp16")]; tensor aw_55_equation_0 = const()[name = tensor("aw_55_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_55_cast_fp16 = einsum(equation = aw_55_equation_0, values = (var_653_cast_fp16_3, var_643_cast_fp16_3))[name = tensor("aw_55_cast_fp16")]; tensor aw_57_equation_0 = const()[name = tensor("aw_57_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_57_cast_fp16 = einsum(equation = aw_57_equation_0, values = (var_653_cast_fp16_4, var_643_cast_fp16_4))[name = tensor("aw_57_cast_fp16")]; tensor aw_59_equation_0 = const()[name = tensor("aw_59_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_59_cast_fp16 = einsum(equation = aw_59_equation_0, values = (var_653_cast_fp16_5, var_643_cast_fp16_5))[name = tensor("aw_59_cast_fp16")]; tensor aw_61_equation_0 = const()[name = tensor("aw_61_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_61_cast_fp16 = einsum(equation = aw_61_equation_0, values = (var_653_cast_fp16_6, var_643_cast_fp16_6))[name = tensor("aw_61_cast_fp16")]; tensor aw_63_equation_0 = const()[name = tensor("aw_63_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_63_cast_fp16 = einsum(equation = aw_63_equation_0, values = (var_653_cast_fp16_7, var_643_cast_fp16_7))[name = tensor("aw_63_cast_fp16")]; tensor var_687_cast_fp16 = softmax(axis = var_591, x = aw_49_cast_fp16)[name = tensor("op_687_cast_fp16")]; tensor var_688_cast_fp16 = softmax(axis = var_591, x = aw_51_cast_fp16)[name = tensor("op_688_cast_fp16")]; tensor var_689_cast_fp16 = softmax(axis = var_591, x = aw_53_cast_fp16)[name = tensor("op_689_cast_fp16")]; tensor var_690_cast_fp16 = softmax(axis = var_591, x = aw_55_cast_fp16)[name = tensor("op_690_cast_fp16")]; tensor var_691_cast_fp16 = softmax(axis = var_591, x = aw_57_cast_fp16)[name = tensor("op_691_cast_fp16")]; tensor var_692_cast_fp16 = softmax(axis = var_591, x = aw_59_cast_fp16)[name = tensor("op_692_cast_fp16")]; tensor var_693_cast_fp16 = softmax(axis = var_591, x = aw_61_cast_fp16)[name = tensor("op_693_cast_fp16")]; tensor var_694_cast_fp16 = softmax(axis = var_591, x = aw_63_cast_fp16)[name = tensor("op_694_cast_fp16")]; tensor var_696_equation_0 = const()[name = tensor("op_696_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_696_cast_fp16 = einsum(equation = var_696_equation_0, values = (var_662_cast_fp16_0, var_687_cast_fp16))[name = tensor("op_696_cast_fp16")]; tensor var_698_equation_0 = const()[name = tensor("op_698_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_698_cast_fp16 = einsum(equation = var_698_equation_0, values = (var_662_cast_fp16_1, var_688_cast_fp16))[name = tensor("op_698_cast_fp16")]; tensor var_700_equation_0 = const()[name = tensor("op_700_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_700_cast_fp16 = einsum(equation = var_700_equation_0, values = (var_662_cast_fp16_2, var_689_cast_fp16))[name = tensor("op_700_cast_fp16")]; tensor var_702_equation_0 = const()[name = tensor("op_702_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_702_cast_fp16 = einsum(equation = var_702_equation_0, values = (var_662_cast_fp16_3, var_690_cast_fp16))[name = tensor("op_702_cast_fp16")]; tensor var_704_equation_0 = const()[name = tensor("op_704_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_704_cast_fp16 = einsum(equation = var_704_equation_0, values = (var_662_cast_fp16_4, var_691_cast_fp16))[name = tensor("op_704_cast_fp16")]; tensor var_706_equation_0 = const()[name = tensor("op_706_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_706_cast_fp16 = einsum(equation = var_706_equation_0, values = (var_662_cast_fp16_5, var_692_cast_fp16))[name = tensor("op_706_cast_fp16")]; tensor var_708_equation_0 = const()[name = tensor("op_708_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_708_cast_fp16 = einsum(equation = var_708_equation_0, values = (var_662_cast_fp16_6, var_693_cast_fp16))[name = tensor("op_708_cast_fp16")]; tensor var_710_equation_0 = const()[name = tensor("op_710_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_710_cast_fp16 = einsum(equation = var_710_equation_0, values = (var_662_cast_fp16_7, var_694_cast_fp16))[name = tensor("op_710_cast_fp16")]; tensor input_35_interleave_0 = const()[name = tensor("input_35_interleave_0"), val = tensor(false)]; tensor input_35_cast_fp16 = concat(axis = var_591, interleave = input_35_interleave_0, values = (var_696_cast_fp16, var_698_cast_fp16, var_700_cast_fp16, var_702_cast_fp16, var_704_cast_fp16, var_706_cast_fp16, var_708_cast_fp16, var_710_cast_fp16))[name = tensor("input_35_cast_fp16")]; tensor var_719_pad_type_0 = const()[name = tensor("op_719_pad_type_0"), val = tensor("valid")]; tensor var_719_strides_0 = const()[name = tensor("op_719_strides_0"), val = tensor([1, 1])]; tensor var_719_pad_0 = const()[name = tensor("op_719_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_719_dilations_0 = const()[name = tensor("op_719_dilations_0"), val = tensor([1, 1])]; tensor var_719_groups_0 = const()[name = tensor("op_719_groups_0"), val = tensor(1)]; tensor blocks_3_attn_out_weight_to_fp16 = const()[name = tensor("blocks_3_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23848576)))]; tensor blocks_3_attn_out_bias_to_fp16 = const()[name = tensor("blocks_3_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24372928)))]; tensor var_719_cast_fp16 = conv(bias = blocks_3_attn_out_bias_to_fp16, dilations = var_719_dilations_0, groups = var_719_groups_0, pad = var_719_pad_0, pad_type = var_719_pad_type_0, strides = var_719_strides_0, weight = blocks_3_attn_out_weight_to_fp16, x = input_35_cast_fp16)[name = tensor("op_719_cast_fp16")]; tensor inputs_15_cast_fp16 = add(x = inputs_13_cast_fp16, y = var_719_cast_fp16)[name = tensor("inputs_15_cast_fp16")]; tensor input_37_axes_0 = const()[name = tensor("input_37_axes_0"), val = tensor([1])]; tensor input_37_gamma_0_to_fp16 = const()[name = tensor("input_37_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24374016)))]; tensor input_37_beta_0_to_fp16 = const()[name = tensor("input_37_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24375104)))]; tensor var_729_to_fp16 = const()[name = tensor("op_729_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_37_cast_fp16 = layer_norm(axes = input_37_axes_0, beta = input_37_beta_0_to_fp16, epsilon = var_729_to_fp16, gamma = input_37_gamma_0_to_fp16, x = inputs_15_cast_fp16)[name = tensor("input_37_cast_fp16")]; tensor input_39_pad_type_0 = const()[name = tensor("input_39_pad_type_0"), val = tensor("valid")]; tensor input_39_strides_0 = const()[name = tensor("input_39_strides_0"), val = tensor([1, 1])]; tensor input_39_pad_0 = const()[name = tensor("input_39_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_39_dilations_0 = const()[name = tensor("input_39_dilations_0"), val = tensor([1, 1])]; tensor input_39_groups_0 = const()[name = tensor("input_39_groups_0"), val = tensor(1)]; tensor blocks_3_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_3_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24376192)))]; tensor blocks_3_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_3_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26473408)))]; tensor input_39_cast_fp16 = conv(bias = blocks_3_mlp_0_bias_to_fp16, dilations = input_39_dilations_0, groups = input_39_groups_0, pad = input_39_pad_0, pad_type = input_39_pad_type_0, strides = input_39_strides_0, weight = blocks_3_mlp_0_weight_to_fp16, x = input_37_cast_fp16)[name = tensor("input_39_cast_fp16")]; tensor input_41_mode_0 = const()[name = tensor("input_41_mode_0"), val = tensor("EXACT")]; tensor input_41_cast_fp16 = gelu(mode = input_41_mode_0, x = input_39_cast_fp16)[name = tensor("input_41_cast_fp16")]; tensor var_755_pad_type_0 = const()[name = tensor("op_755_pad_type_0"), val = tensor("valid")]; tensor var_755_strides_0 = const()[name = tensor("op_755_strides_0"), val = tensor([1, 1])]; tensor var_755_pad_0 = const()[name = tensor("op_755_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_755_dilations_0 = const()[name = tensor("op_755_dilations_0"), val = tensor([1, 1])]; tensor var_755_groups_0 = const()[name = tensor("op_755_groups_0"), val = tensor(1)]; tensor blocks_3_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_3_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26477568)))]; tensor blocks_3_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_3_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28574784)))]; tensor var_755_cast_fp16 = conv(bias = blocks_3_mlp_2_bias_to_fp16, dilations = var_755_dilations_0, groups = var_755_groups_0, pad = var_755_pad_0, pad_type = var_755_pad_type_0, strides = var_755_strides_0, weight = blocks_3_mlp_2_weight_to_fp16, x = input_41_cast_fp16)[name = tensor("op_755_cast_fp16")]; tensor inputs_17_cast_fp16 = add(x = inputs_15_cast_fp16, y = var_755_cast_fp16)[name = tensor("inputs_17_cast_fp16")]; tensor var_764 = const()[name = tensor("op_764"), val = tensor(1)]; tensor input_43_axes_0 = const()[name = tensor("input_43_axes_0"), val = tensor([1])]; tensor input_43_gamma_0_to_fp16 = const()[name = tensor("input_43_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28575872)))]; tensor input_43_beta_0_to_fp16 = const()[name = tensor("input_43_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28576960)))]; tensor var_780_to_fp16 = const()[name = tensor("op_780_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_43_cast_fp16 = layer_norm(axes = input_43_axes_0, beta = input_43_beta_0_to_fp16, epsilon = var_780_to_fp16, gamma = input_43_gamma_0_to_fp16, x = inputs_17_cast_fp16)[name = tensor("input_43_cast_fp16")]; tensor q_9_pad_type_0 = const()[name = tensor("q_9_pad_type_0"), val = tensor("valid")]; tensor q_9_strides_0 = const()[name = tensor("q_9_strides_0"), val = tensor([1, 1])]; tensor q_9_pad_0 = const()[name = tensor("q_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_9_dilations_0 = const()[name = tensor("q_9_dilations_0"), val = tensor([1, 1])]; tensor q_9_groups_0 = const()[name = tensor("q_9_groups_0"), val = tensor(1)]; tensor var_815_weight_0_to_fp16 = const()[name = tensor("op_815_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28578048)))]; tensor var_815_bias_0_to_fp16 = const()[name = tensor("op_815_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29102400)))]; tensor var_815_cast_fp16 = conv(bias = var_815_bias_0_to_fp16, dilations = q_9_dilations_0, groups = q_9_groups_0, pad = q_9_pad_0, pad_type = q_9_pad_type_0, strides = q_9_strides_0, weight = var_815_weight_0_to_fp16, x = input_43_cast_fp16)[name = tensor("op_815_cast_fp16")]; tensor k_9_pad_type_0 = const()[name = tensor("k_9_pad_type_0"), val = tensor("valid")]; tensor k_9_strides_0 = const()[name = tensor("k_9_strides_0"), val = tensor([1, 1])]; tensor k_9_pad_0 = const()[name = tensor("k_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_9_dilations_0 = const()[name = tensor("k_9_dilations_0"), val = tensor([1, 1])]; tensor k_9_groups_0 = const()[name = tensor("k_9_groups_0"), val = tensor(1)]; tensor blocks_4_attn_key_weight_to_fp16 = const()[name = tensor("blocks_4_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29103488)))]; tensor k_9_cast_fp16 = conv(dilations = k_9_dilations_0, groups = k_9_groups_0, pad = k_9_pad_0, pad_type = k_9_pad_type_0, strides = k_9_strides_0, weight = blocks_4_attn_key_weight_to_fp16, x = input_43_cast_fp16)[name = tensor("k_9_cast_fp16")]; tensor var_813_pad_type_0 = const()[name = tensor("op_813_pad_type_0"), val = tensor("valid")]; tensor var_813_strides_0 = const()[name = tensor("op_813_strides_0"), val = tensor([1, 1])]; tensor var_813_pad_0 = const()[name = tensor("op_813_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_813_dilations_0 = const()[name = tensor("op_813_dilations_0"), val = tensor([1, 1])]; tensor var_813_groups_0 = const()[name = tensor("op_813_groups_0"), val = tensor(1)]; tensor blocks_4_attn_value_weight_to_fp16 = const()[name = tensor("blocks_4_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29627840)))]; tensor blocks_4_attn_value_bias_to_fp16 = const()[name = tensor("blocks_4_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30152192)))]; tensor var_813_cast_fp16 = conv(bias = blocks_4_attn_value_bias_to_fp16, dilations = var_813_dilations_0, groups = var_813_groups_0, pad = var_813_pad_0, pad_type = var_813_pad_type_0, strides = var_813_strides_0, weight = blocks_4_attn_value_weight_to_fp16, x = input_43_cast_fp16)[name = tensor("op_813_cast_fp16")]; tensor tile_12 = const()[name = tensor("tile_12"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_816_axis_0 = const()[name = tensor("op_816_axis_0"), val = tensor(1)]; tensor var_816_cast_fp16_0, tensor var_816_cast_fp16_1, tensor var_816_cast_fp16_2, tensor var_816_cast_fp16_3, tensor var_816_cast_fp16_4, tensor var_816_cast_fp16_5, tensor var_816_cast_fp16_6, tensor var_816_cast_fp16_7 = split(axis = var_816_axis_0, split_sizes = tile_12, x = var_815_cast_fp16)[name = tensor("op_816_cast_fp16")]; tensor var_825_perm_0 = const()[name = tensor("op_825_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_13 = const()[name = tensor("tile_13"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_826_axis_0 = const()[name = tensor("op_826_axis_0"), val = tensor(3)]; tensor var_825_cast_fp16 = transpose(perm = var_825_perm_0, x = k_9_cast_fp16)[name = tensor("transpose_2")]; tensor var_826_cast_fp16_0, tensor var_826_cast_fp16_1, tensor var_826_cast_fp16_2, tensor var_826_cast_fp16_3, tensor var_826_cast_fp16_4, tensor var_826_cast_fp16_5, tensor var_826_cast_fp16_6, tensor var_826_cast_fp16_7 = split(axis = var_826_axis_0, split_sizes = tile_13, x = var_825_cast_fp16)[name = tensor("op_826_cast_fp16")]; tensor tile_14 = const()[name = tensor("tile_14"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_835_axis_0 = const()[name = tensor("op_835_axis_0"), val = tensor(1)]; tensor var_835_cast_fp16_0, tensor var_835_cast_fp16_1, tensor var_835_cast_fp16_2, tensor var_835_cast_fp16_3, tensor var_835_cast_fp16_4, tensor var_835_cast_fp16_5, tensor var_835_cast_fp16_6, tensor var_835_cast_fp16_7 = split(axis = var_835_axis_0, split_sizes = tile_14, x = var_813_cast_fp16)[name = tensor("op_835_cast_fp16")]; tensor aw_65_equation_0 = const()[name = tensor("aw_65_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_65_cast_fp16 = einsum(equation = aw_65_equation_0, values = (var_826_cast_fp16_0, var_816_cast_fp16_0))[name = tensor("aw_65_cast_fp16")]; tensor aw_67_equation_0 = const()[name = tensor("aw_67_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_67_cast_fp16 = einsum(equation = aw_67_equation_0, values = (var_826_cast_fp16_1, var_816_cast_fp16_1))[name = tensor("aw_67_cast_fp16")]; tensor aw_69_equation_0 = const()[name = tensor("aw_69_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_69_cast_fp16 = einsum(equation = aw_69_equation_0, values = (var_826_cast_fp16_2, var_816_cast_fp16_2))[name = tensor("aw_69_cast_fp16")]; tensor aw_71_equation_0 = const()[name = tensor("aw_71_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_71_cast_fp16 = einsum(equation = aw_71_equation_0, values = (var_826_cast_fp16_3, var_816_cast_fp16_3))[name = tensor("aw_71_cast_fp16")]; tensor aw_73_equation_0 = const()[name = tensor("aw_73_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_73_cast_fp16 = einsum(equation = aw_73_equation_0, values = (var_826_cast_fp16_4, var_816_cast_fp16_4))[name = tensor("aw_73_cast_fp16")]; tensor aw_75_equation_0 = const()[name = tensor("aw_75_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_75_cast_fp16 = einsum(equation = aw_75_equation_0, values = (var_826_cast_fp16_5, var_816_cast_fp16_5))[name = tensor("aw_75_cast_fp16")]; tensor aw_77_equation_0 = const()[name = tensor("aw_77_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_77_cast_fp16 = einsum(equation = aw_77_equation_0, values = (var_826_cast_fp16_6, var_816_cast_fp16_6))[name = tensor("aw_77_cast_fp16")]; tensor aw_79_equation_0 = const()[name = tensor("aw_79_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_79_cast_fp16 = einsum(equation = aw_79_equation_0, values = (var_826_cast_fp16_7, var_816_cast_fp16_7))[name = tensor("aw_79_cast_fp16")]; tensor var_860_cast_fp16 = softmax(axis = var_764, x = aw_65_cast_fp16)[name = tensor("op_860_cast_fp16")]; tensor var_861_cast_fp16 = softmax(axis = var_764, x = aw_67_cast_fp16)[name = tensor("op_861_cast_fp16")]; tensor var_862_cast_fp16 = softmax(axis = var_764, x = aw_69_cast_fp16)[name = tensor("op_862_cast_fp16")]; tensor var_863_cast_fp16 = softmax(axis = var_764, x = aw_71_cast_fp16)[name = tensor("op_863_cast_fp16")]; tensor var_864_cast_fp16 = softmax(axis = var_764, x = aw_73_cast_fp16)[name = tensor("op_864_cast_fp16")]; tensor var_865_cast_fp16 = softmax(axis = var_764, x = aw_75_cast_fp16)[name = tensor("op_865_cast_fp16")]; tensor var_866_cast_fp16 = softmax(axis = var_764, x = aw_77_cast_fp16)[name = tensor("op_866_cast_fp16")]; tensor var_867_cast_fp16 = softmax(axis = var_764, x = aw_79_cast_fp16)[name = tensor("op_867_cast_fp16")]; tensor var_869_equation_0 = const()[name = tensor("op_869_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_869_cast_fp16 = einsum(equation = var_869_equation_0, values = (var_835_cast_fp16_0, var_860_cast_fp16))[name = tensor("op_869_cast_fp16")]; tensor var_871_equation_0 = const()[name = tensor("op_871_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_871_cast_fp16 = einsum(equation = var_871_equation_0, values = (var_835_cast_fp16_1, var_861_cast_fp16))[name = tensor("op_871_cast_fp16")]; tensor var_873_equation_0 = const()[name = tensor("op_873_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_873_cast_fp16 = einsum(equation = var_873_equation_0, values = (var_835_cast_fp16_2, var_862_cast_fp16))[name = tensor("op_873_cast_fp16")]; tensor var_875_equation_0 = const()[name = tensor("op_875_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_875_cast_fp16 = einsum(equation = var_875_equation_0, values = (var_835_cast_fp16_3, var_863_cast_fp16))[name = tensor("op_875_cast_fp16")]; tensor var_877_equation_0 = const()[name = tensor("op_877_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_877_cast_fp16 = einsum(equation = var_877_equation_0, values = (var_835_cast_fp16_4, var_864_cast_fp16))[name = tensor("op_877_cast_fp16")]; tensor var_879_equation_0 = const()[name = tensor("op_879_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_879_cast_fp16 = einsum(equation = var_879_equation_0, values = (var_835_cast_fp16_5, var_865_cast_fp16))[name = tensor("op_879_cast_fp16")]; tensor var_881_equation_0 = const()[name = tensor("op_881_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_881_cast_fp16 = einsum(equation = var_881_equation_0, values = (var_835_cast_fp16_6, var_866_cast_fp16))[name = tensor("op_881_cast_fp16")]; tensor var_883_equation_0 = const()[name = tensor("op_883_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_883_cast_fp16 = einsum(equation = var_883_equation_0, values = (var_835_cast_fp16_7, var_867_cast_fp16))[name = tensor("op_883_cast_fp16")]; tensor input_45_interleave_0 = const()[name = tensor("input_45_interleave_0"), val = tensor(false)]; tensor input_45_cast_fp16 = concat(axis = var_764, interleave = input_45_interleave_0, values = (var_869_cast_fp16, var_871_cast_fp16, var_873_cast_fp16, var_875_cast_fp16, var_877_cast_fp16, var_879_cast_fp16, var_881_cast_fp16, var_883_cast_fp16))[name = tensor("input_45_cast_fp16")]; tensor var_892_pad_type_0 = const()[name = tensor("op_892_pad_type_0"), val = tensor("valid")]; tensor var_892_strides_0 = const()[name = tensor("op_892_strides_0"), val = tensor([1, 1])]; tensor var_892_pad_0 = const()[name = tensor("op_892_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_892_dilations_0 = const()[name = tensor("op_892_dilations_0"), val = tensor([1, 1])]; tensor var_892_groups_0 = const()[name = tensor("op_892_groups_0"), val = tensor(1)]; tensor blocks_4_attn_out_weight_to_fp16 = const()[name = tensor("blocks_4_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30153280)))]; tensor blocks_4_attn_out_bias_to_fp16 = const()[name = tensor("blocks_4_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30677632)))]; tensor var_892_cast_fp16 = conv(bias = blocks_4_attn_out_bias_to_fp16, dilations = var_892_dilations_0, groups = var_892_groups_0, pad = var_892_pad_0, pad_type = var_892_pad_type_0, strides = var_892_strides_0, weight = blocks_4_attn_out_weight_to_fp16, x = input_45_cast_fp16)[name = tensor("op_892_cast_fp16")]; tensor inputs_19_cast_fp16 = add(x = inputs_17_cast_fp16, y = var_892_cast_fp16)[name = tensor("inputs_19_cast_fp16")]; tensor input_47_axes_0 = const()[name = tensor("input_47_axes_0"), val = tensor([1])]; tensor input_47_gamma_0_to_fp16 = const()[name = tensor("input_47_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30678720)))]; tensor input_47_beta_0_to_fp16 = const()[name = tensor("input_47_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30679808)))]; tensor var_902_to_fp16 = const()[name = tensor("op_902_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_47_cast_fp16 = layer_norm(axes = input_47_axes_0, beta = input_47_beta_0_to_fp16, epsilon = var_902_to_fp16, gamma = input_47_gamma_0_to_fp16, x = inputs_19_cast_fp16)[name = tensor("input_47_cast_fp16")]; tensor input_49_pad_type_0 = const()[name = tensor("input_49_pad_type_0"), val = tensor("valid")]; tensor input_49_strides_0 = const()[name = tensor("input_49_strides_0"), val = tensor([1, 1])]; tensor input_49_pad_0 = const()[name = tensor("input_49_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_49_dilations_0 = const()[name = tensor("input_49_dilations_0"), val = tensor([1, 1])]; tensor input_49_groups_0 = const()[name = tensor("input_49_groups_0"), val = tensor(1)]; tensor blocks_4_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_4_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30680896)))]; tensor blocks_4_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_4_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(32778112)))]; tensor input_49_cast_fp16 = conv(bias = blocks_4_mlp_0_bias_to_fp16, dilations = input_49_dilations_0, groups = input_49_groups_0, pad = input_49_pad_0, pad_type = input_49_pad_type_0, strides = input_49_strides_0, weight = blocks_4_mlp_0_weight_to_fp16, x = input_47_cast_fp16)[name = tensor("input_49_cast_fp16")]; tensor input_51_mode_0 = const()[name = tensor("input_51_mode_0"), val = tensor("EXACT")]; tensor input_51_cast_fp16 = gelu(mode = input_51_mode_0, x = input_49_cast_fp16)[name = tensor("input_51_cast_fp16")]; tensor var_928_pad_type_0 = const()[name = tensor("op_928_pad_type_0"), val = tensor("valid")]; tensor var_928_strides_0 = const()[name = tensor("op_928_strides_0"), val = tensor([1, 1])]; tensor var_928_pad_0 = const()[name = tensor("op_928_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_928_dilations_0 = const()[name = tensor("op_928_dilations_0"), val = tensor([1, 1])]; tensor var_928_groups_0 = const()[name = tensor("op_928_groups_0"), val = tensor(1)]; tensor blocks_4_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_4_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(32782272)))]; tensor blocks_4_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_4_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34879488)))]; tensor var_928_cast_fp16 = conv(bias = blocks_4_mlp_2_bias_to_fp16, dilations = var_928_dilations_0, groups = var_928_groups_0, pad = var_928_pad_0, pad_type = var_928_pad_type_0, strides = var_928_strides_0, weight = blocks_4_mlp_2_weight_to_fp16, x = input_51_cast_fp16)[name = tensor("op_928_cast_fp16")]; tensor inputs_21_cast_fp16 = add(x = inputs_19_cast_fp16, y = var_928_cast_fp16)[name = tensor("inputs_21_cast_fp16")]; tensor var_937 = const()[name = tensor("op_937"), val = tensor(1)]; tensor input_53_axes_0 = const()[name = tensor("input_53_axes_0"), val = tensor([1])]; tensor input_53_gamma_0_to_fp16 = const()[name = tensor("input_53_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34880576)))]; tensor input_53_beta_0_to_fp16 = const()[name = tensor("input_53_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34881664)))]; tensor var_953_to_fp16 = const()[name = tensor("op_953_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_53_cast_fp16 = layer_norm(axes = input_53_axes_0, beta = input_53_beta_0_to_fp16, epsilon = var_953_to_fp16, gamma = input_53_gamma_0_to_fp16, x = inputs_21_cast_fp16)[name = tensor("input_53_cast_fp16")]; tensor q_pad_type_0 = const()[name = tensor("q_pad_type_0"), val = tensor("valid")]; tensor q_strides_0 = const()[name = tensor("q_strides_0"), val = tensor([1, 1])]; tensor q_pad_0 = const()[name = tensor("q_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_dilations_0 = const()[name = tensor("q_dilations_0"), val = tensor([1, 1])]; tensor q_groups_0 = const()[name = tensor("q_groups_0"), val = tensor(1)]; tensor var_988_weight_0_to_fp16 = const()[name = tensor("op_988_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34882752)))]; tensor var_988_bias_0_to_fp16 = const()[name = tensor("op_988_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35407104)))]; tensor var_988_cast_fp16 = conv(bias = var_988_bias_0_to_fp16, dilations = q_dilations_0, groups = q_groups_0, pad = q_pad_0, pad_type = q_pad_type_0, strides = q_strides_0, weight = var_988_weight_0_to_fp16, x = input_53_cast_fp16)[name = tensor("op_988_cast_fp16")]; tensor k_pad_type_0 = const()[name = tensor("k_pad_type_0"), val = tensor("valid")]; tensor k_strides_0 = const()[name = tensor("k_strides_0"), val = tensor([1, 1])]; tensor k_pad_0 = const()[name = tensor("k_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_dilations_0 = const()[name = tensor("k_dilations_0"), val = tensor([1, 1])]; tensor k_groups_0 = const()[name = tensor("k_groups_0"), val = tensor(1)]; tensor blocks_5_attn_key_weight_to_fp16 = const()[name = tensor("blocks_5_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35408192)))]; tensor k_cast_fp16 = conv(dilations = k_dilations_0, groups = k_groups_0, pad = k_pad_0, pad_type = k_pad_type_0, strides = k_strides_0, weight = blocks_5_attn_key_weight_to_fp16, x = input_53_cast_fp16)[name = tensor("k_cast_fp16")]; tensor var_986_pad_type_0 = const()[name = tensor("op_986_pad_type_0"), val = tensor("valid")]; tensor var_986_strides_0 = const()[name = tensor("op_986_strides_0"), val = tensor([1, 1])]; tensor var_986_pad_0 = const()[name = tensor("op_986_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_986_dilations_0 = const()[name = tensor("op_986_dilations_0"), val = tensor([1, 1])]; tensor var_986_groups_0 = const()[name = tensor("op_986_groups_0"), val = tensor(1)]; tensor blocks_5_attn_value_weight_to_fp16 = const()[name = tensor("blocks_5_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35932544)))]; tensor blocks_5_attn_value_bias_to_fp16 = const()[name = tensor("blocks_5_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36456896)))]; tensor var_986_cast_fp16 = conv(bias = blocks_5_attn_value_bias_to_fp16, dilations = var_986_dilations_0, groups = var_986_groups_0, pad = var_986_pad_0, pad_type = var_986_pad_type_0, strides = var_986_strides_0, weight = blocks_5_attn_value_weight_to_fp16, x = input_53_cast_fp16)[name = tensor("op_986_cast_fp16")]; tensor tile_15 = const()[name = tensor("tile_15"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_989_axis_0 = const()[name = tensor("op_989_axis_0"), val = tensor(1)]; tensor var_989_cast_fp16_0, tensor var_989_cast_fp16_1, tensor var_989_cast_fp16_2, tensor var_989_cast_fp16_3, tensor var_989_cast_fp16_4, tensor var_989_cast_fp16_5, tensor var_989_cast_fp16_6, tensor var_989_cast_fp16_7 = split(axis = var_989_axis_0, split_sizes = tile_15, x = var_988_cast_fp16)[name = tensor("op_989_cast_fp16")]; tensor var_998_perm_0 = const()[name = tensor("op_998_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_16 = const()[name = tensor("tile_16"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_999_axis_0 = const()[name = tensor("op_999_axis_0"), val = tensor(3)]; tensor var_998_cast_fp16 = transpose(perm = var_998_perm_0, x = k_cast_fp16)[name = tensor("transpose_1")]; tensor var_999_cast_fp16_0, tensor var_999_cast_fp16_1, tensor var_999_cast_fp16_2, tensor var_999_cast_fp16_3, tensor var_999_cast_fp16_4, tensor var_999_cast_fp16_5, tensor var_999_cast_fp16_6, tensor var_999_cast_fp16_7 = split(axis = var_999_axis_0, split_sizes = tile_16, x = var_998_cast_fp16)[name = tensor("op_999_cast_fp16")]; tensor tile_17 = const()[name = tensor("tile_17"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_1008_axis_0 = const()[name = tensor("op_1008_axis_0"), val = tensor(1)]; tensor var_1008_cast_fp16_0, tensor var_1008_cast_fp16_1, tensor var_1008_cast_fp16_2, tensor var_1008_cast_fp16_3, tensor var_1008_cast_fp16_4, tensor var_1008_cast_fp16_5, tensor var_1008_cast_fp16_6, tensor var_1008_cast_fp16_7 = split(axis = var_1008_axis_0, split_sizes = tile_17, x = var_986_cast_fp16)[name = tensor("op_1008_cast_fp16")]; tensor aw_81_equation_0 = const()[name = tensor("aw_81_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_81_cast_fp16 = einsum(equation = aw_81_equation_0, values = (var_999_cast_fp16_0, var_989_cast_fp16_0))[name = tensor("aw_81_cast_fp16")]; tensor aw_83_equation_0 = const()[name = tensor("aw_83_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_83_cast_fp16 = einsum(equation = aw_83_equation_0, values = (var_999_cast_fp16_1, var_989_cast_fp16_1))[name = tensor("aw_83_cast_fp16")]; tensor aw_85_equation_0 = const()[name = tensor("aw_85_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_85_cast_fp16 = einsum(equation = aw_85_equation_0, values = (var_999_cast_fp16_2, var_989_cast_fp16_2))[name = tensor("aw_85_cast_fp16")]; tensor aw_87_equation_0 = const()[name = tensor("aw_87_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_87_cast_fp16 = einsum(equation = aw_87_equation_0, values = (var_999_cast_fp16_3, var_989_cast_fp16_3))[name = tensor("aw_87_cast_fp16")]; tensor aw_89_equation_0 = const()[name = tensor("aw_89_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_89_cast_fp16 = einsum(equation = aw_89_equation_0, values = (var_999_cast_fp16_4, var_989_cast_fp16_4))[name = tensor("aw_89_cast_fp16")]; tensor aw_91_equation_0 = const()[name = tensor("aw_91_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_91_cast_fp16 = einsum(equation = aw_91_equation_0, values = (var_999_cast_fp16_5, var_989_cast_fp16_5))[name = tensor("aw_91_cast_fp16")]; tensor aw_93_equation_0 = const()[name = tensor("aw_93_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_93_cast_fp16 = einsum(equation = aw_93_equation_0, values = (var_999_cast_fp16_6, var_989_cast_fp16_6))[name = tensor("aw_93_cast_fp16")]; tensor aw_equation_0 = const()[name = tensor("aw_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_cast_fp16 = einsum(equation = aw_equation_0, values = (var_999_cast_fp16_7, var_989_cast_fp16_7))[name = tensor("aw_cast_fp16")]; tensor var_1033_cast_fp16 = softmax(axis = var_937, x = aw_81_cast_fp16)[name = tensor("op_1033_cast_fp16")]; tensor var_1034_cast_fp16 = softmax(axis = var_937, x = aw_83_cast_fp16)[name = tensor("op_1034_cast_fp16")]; tensor var_1035_cast_fp16 = softmax(axis = var_937, x = aw_85_cast_fp16)[name = tensor("op_1035_cast_fp16")]; tensor var_1036_cast_fp16 = softmax(axis = var_937, x = aw_87_cast_fp16)[name = tensor("op_1036_cast_fp16")]; tensor var_1037_cast_fp16 = softmax(axis = var_937, x = aw_89_cast_fp16)[name = tensor("op_1037_cast_fp16")]; tensor var_1038_cast_fp16 = softmax(axis = var_937, x = aw_91_cast_fp16)[name = tensor("op_1038_cast_fp16")]; tensor var_1039_cast_fp16 = softmax(axis = var_937, x = aw_93_cast_fp16)[name = tensor("op_1039_cast_fp16")]; tensor var_1040_cast_fp16 = softmax(axis = var_937, x = aw_cast_fp16)[name = tensor("op_1040_cast_fp16")]; tensor var_1042_equation_0 = const()[name = tensor("op_1042_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1042_cast_fp16 = einsum(equation = var_1042_equation_0, values = (var_1008_cast_fp16_0, var_1033_cast_fp16))[name = tensor("op_1042_cast_fp16")]; tensor var_1044_equation_0 = const()[name = tensor("op_1044_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1044_cast_fp16 = einsum(equation = var_1044_equation_0, values = (var_1008_cast_fp16_1, var_1034_cast_fp16))[name = tensor("op_1044_cast_fp16")]; tensor var_1046_equation_0 = const()[name = tensor("op_1046_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1046_cast_fp16 = einsum(equation = var_1046_equation_0, values = (var_1008_cast_fp16_2, var_1035_cast_fp16))[name = tensor("op_1046_cast_fp16")]; tensor var_1048_equation_0 = const()[name = tensor("op_1048_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1048_cast_fp16 = einsum(equation = var_1048_equation_0, values = (var_1008_cast_fp16_3, var_1036_cast_fp16))[name = tensor("op_1048_cast_fp16")]; tensor var_1050_equation_0 = const()[name = tensor("op_1050_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1050_cast_fp16 = einsum(equation = var_1050_equation_0, values = (var_1008_cast_fp16_4, var_1037_cast_fp16))[name = tensor("op_1050_cast_fp16")]; tensor var_1052_equation_0 = const()[name = tensor("op_1052_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1052_cast_fp16 = einsum(equation = var_1052_equation_0, values = (var_1008_cast_fp16_5, var_1038_cast_fp16))[name = tensor("op_1052_cast_fp16")]; tensor var_1054_equation_0 = const()[name = tensor("op_1054_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1054_cast_fp16 = einsum(equation = var_1054_equation_0, values = (var_1008_cast_fp16_6, var_1039_cast_fp16))[name = tensor("op_1054_cast_fp16")]; tensor var_1056_equation_0 = const()[name = tensor("op_1056_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1056_cast_fp16 = einsum(equation = var_1056_equation_0, values = (var_1008_cast_fp16_7, var_1040_cast_fp16))[name = tensor("op_1056_cast_fp16")]; tensor input_55_interleave_0 = const()[name = tensor("input_55_interleave_0"), val = tensor(false)]; tensor input_55_cast_fp16 = concat(axis = var_937, interleave = input_55_interleave_0, values = (var_1042_cast_fp16, var_1044_cast_fp16, var_1046_cast_fp16, var_1048_cast_fp16, var_1050_cast_fp16, var_1052_cast_fp16, var_1054_cast_fp16, var_1056_cast_fp16))[name = tensor("input_55_cast_fp16")]; tensor var_1065_pad_type_0 = const()[name = tensor("op_1065_pad_type_0"), val = tensor("valid")]; tensor var_1065_strides_0 = const()[name = tensor("op_1065_strides_0"), val = tensor([1, 1])]; tensor var_1065_pad_0 = const()[name = tensor("op_1065_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_1065_dilations_0 = const()[name = tensor("op_1065_dilations_0"), val = tensor([1, 1])]; tensor var_1065_groups_0 = const()[name = tensor("op_1065_groups_0"), val = tensor(1)]; tensor blocks_5_attn_out_weight_to_fp16 = const()[name = tensor("blocks_5_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36457984)))]; tensor blocks_5_attn_out_bias_to_fp16 = const()[name = tensor("blocks_5_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36982336)))]; tensor var_1065_cast_fp16 = conv(bias = blocks_5_attn_out_bias_to_fp16, dilations = var_1065_dilations_0, groups = var_1065_groups_0, pad = var_1065_pad_0, pad_type = var_1065_pad_type_0, strides = var_1065_strides_0, weight = blocks_5_attn_out_weight_to_fp16, x = input_55_cast_fp16)[name = tensor("op_1065_cast_fp16")]; tensor inputs_23_cast_fp16 = add(x = inputs_21_cast_fp16, y = var_1065_cast_fp16)[name = tensor("inputs_23_cast_fp16")]; tensor input_57_axes_0 = const()[name = tensor("input_57_axes_0"), val = tensor([1])]; tensor input_57_gamma_0_to_fp16 = const()[name = tensor("input_57_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36983424)))]; tensor input_57_beta_0_to_fp16 = const()[name = tensor("input_57_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36984512)))]; tensor var_1075_to_fp16 = const()[name = tensor("op_1075_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_57_cast_fp16 = layer_norm(axes = input_57_axes_0, beta = input_57_beta_0_to_fp16, epsilon = var_1075_to_fp16, gamma = input_57_gamma_0_to_fp16, x = inputs_23_cast_fp16)[name = tensor("input_57_cast_fp16")]; tensor input_59_pad_type_0 = const()[name = tensor("input_59_pad_type_0"), val = tensor("valid")]; tensor input_59_strides_0 = const()[name = tensor("input_59_strides_0"), val = tensor([1, 1])]; tensor input_59_pad_0 = const()[name = tensor("input_59_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_59_dilations_0 = const()[name = tensor("input_59_dilations_0"), val = tensor([1, 1])]; tensor input_59_groups_0 = const()[name = tensor("input_59_groups_0"), val = tensor(1)]; tensor blocks_5_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_5_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36985600)))]; tensor blocks_5_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_5_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39082816)))]; tensor input_59_cast_fp16 = conv(bias = blocks_5_mlp_0_bias_to_fp16, dilations = input_59_dilations_0, groups = input_59_groups_0, pad = input_59_pad_0, pad_type = input_59_pad_type_0, strides = input_59_strides_0, weight = blocks_5_mlp_0_weight_to_fp16, x = input_57_cast_fp16)[name = tensor("input_59_cast_fp16")]; tensor input_mode_0 = const()[name = tensor("input_mode_0"), val = tensor("EXACT")]; tensor input_cast_fp16 = gelu(mode = input_mode_0, x = input_59_cast_fp16)[name = tensor("input_cast_fp16")]; tensor var_1101_pad_type_0 = const()[name = tensor("op_1101_pad_type_0"), val = tensor("valid")]; tensor var_1101_strides_0 = const()[name = tensor("op_1101_strides_0"), val = tensor([1, 1])]; tensor var_1101_pad_0 = const()[name = tensor("op_1101_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_1101_dilations_0 = const()[name = tensor("op_1101_dilations_0"), val = tensor([1, 1])]; tensor var_1101_groups_0 = const()[name = tensor("op_1101_groups_0"), val = tensor(1)]; tensor blocks_5_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_5_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39086976)))]; tensor blocks_5_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_5_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41184192)))]; tensor var_1101_cast_fp16 = conv(bias = blocks_5_mlp_2_bias_to_fp16, dilations = var_1101_dilations_0, groups = var_1101_groups_0, pad = var_1101_pad_0, pad_type = var_1101_pad_type_0, strides = var_1101_strides_0, weight = blocks_5_mlp_2_weight_to_fp16, x = input_cast_fp16)[name = tensor("op_1101_cast_fp16")]; tensor inputs_cast_fp16 = add(x = inputs_23_cast_fp16, y = var_1101_cast_fp16)[name = tensor("inputs_cast_fp16")]; tensor x_axes_0 = const()[name = tensor("x_axes_0"), val = tensor([1])]; tensor x_gamma_0_to_fp16 = const()[name = tensor("x_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41185280)))]; tensor x_beta_0_to_fp16 = const()[name = tensor("x_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41186368)))]; tensor var_1115_to_fp16 = const()[name = tensor("op_1115_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_cast_fp16 = layer_norm(axes = x_axes_0, beta = x_beta_0_to_fp16, epsilon = var_1115_to_fp16, gamma = x_gamma_0_to_fp16, x = inputs_cast_fp16)[name = tensor("x_cast_fp16")]; tensor var_1126_axes_0 = const()[name = tensor("op_1126_axes_0"), val = tensor([2])]; tensor var_1126_cast_fp16 = squeeze(axes = var_1126_axes_0, x = x_cast_fp16)[name = tensor("op_1126_cast_fp16")]; tensor var_1129_perm_0 = const()[name = tensor("op_1129_perm_0"), val = tensor([0, 2, 1])]; tensor var_1129_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("op_1129_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor var_1129_cast_fp16 = transpose(perm = var_1129_perm_0, x = var_1126_cast_fp16)[name = tensor("transpose_0")]; tensor output = cast(dtype = var_1129_cast_fp16_to_fp32_dtype_0, x = var_1129_cast_fp16)[name = tensor("cast_27")]; } -> (output); }