program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3520.4.1"}, {"coremlc-version", "3520.5.1"}, {"coremltools-component-torch", "2.10.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "9.0"}})] { func main(tensor audio_embed, tensor encoder_mask, tensor encoder_output) { tensor cast_94_dtype_0 = const()[name = tensor("cast_94_dtype_0"), val = tensor("bool")]; tensor cast_94 = cast(dtype = cast_94_dtype_0, x = encoder_mask)[name = tensor("cast_94")]; tensor var_40_to_fp16 = const()[name = tensor("op_40_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor input_3_cast_fp16 = add(x = audio_embed, y = var_40_to_fp16)[name = tensor("input_3_cast_fp16")]; tensor var_54 = const()[name = tensor("op_54"), val = tensor(-1)]; tensor x_1_axes_0 = const()[name = tensor("x_1_axes_0"), val = tensor([-1])]; tensor layers_0_norm_sa_weight_to_fp16 = const()[name = tensor("layers_0_norm_sa_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169088)))]; tensor var_61_to_fp16 = const()[name = tensor("op_61_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_1_cast_fp16 = layer_norm(axes = x_1_axes_0, epsilon = var_61_to_fp16, gamma = layers_0_norm_sa_weight_to_fp16, x = input_3_cast_fp16)[name = tensor("x_1_cast_fp16")]; tensor layers_0_self_attn_qkv_proj_weight_to_fp16 = const()[name = tensor("layers_0_self_attn_qkv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(170688)))]; tensor linear_0_bias_0_to_fp16 = const()[name = tensor("linear_0_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3709696)))]; tensor linear_0_cast_fp16 = linear(bias = linear_0_bias_0_to_fp16, weight = layers_0_self_attn_qkv_proj_weight_to_fp16, x = x_1_cast_fp16)[name = tensor("linear_0_cast_fp16")]; tensor var_79 = const()[name = tensor("op_79"), val = tensor([1, 110, 3, 12, 64])]; tensor qkv_1_cast_fp16 = reshape(shape = var_79, x = linear_0_cast_fp16)[name = tensor("qkv_1_cast_fp16")]; tensor q_1_begin_0 = const()[name = tensor("q_1_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_1_end_0 = const()[name = tensor("q_1_end_0"), val = tensor([1, 110, 1, 12, 64])]; tensor q_1_end_mask_0 = const()[name = tensor("q_1_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_1_squeeze_mask_0 = const()[name = tensor("q_1_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_1_cast_fp16 = slice_by_index(begin = q_1_begin_0, end = q_1_end_0, end_mask = q_1_end_mask_0, squeeze_mask = q_1_squeeze_mask_0, x = qkv_1_cast_fp16)[name = tensor("q_1_cast_fp16")]; tensor k_1_begin_0 = const()[name = tensor("k_1_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_1_end_0 = const()[name = tensor("k_1_end_0"), val = tensor([1, 110, 2, 12, 64])]; tensor k_1_end_mask_0 = const()[name = tensor("k_1_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_1_squeeze_mask_0 = const()[name = tensor("k_1_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_1_cast_fp16 = slice_by_index(begin = k_1_begin_0, end = k_1_end_0, end_mask = k_1_end_mask_0, squeeze_mask = k_1_squeeze_mask_0, x = qkv_1_cast_fp16)[name = tensor("k_1_cast_fp16")]; tensor v_1_begin_0 = const()[name = tensor("v_1_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_1_end_0 = const()[name = tensor("v_1_end_0"), val = tensor([1, 110, 3, 12, 64])]; tensor v_1_end_mask_0 = const()[name = tensor("v_1_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_1_squeeze_mask_0 = const()[name = tensor("v_1_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_1_cast_fp16 = slice_by_index(begin = v_1_begin_0, end = v_1_end_0, end_mask = v_1_end_mask_0, squeeze_mask = v_1_squeeze_mask_0, x = qkv_1_cast_fp16)[name = tensor("v_1_cast_fp16")]; tensor v_t_1_perm_0 = const()[name = tensor("v_t_1_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_94_transpose_x_0 = const()[name = tensor("op_94_transpose_x_0"), val = tensor(false)]; tensor var_94_transpose_y_0 = const()[name = tensor("op_94_transpose_y_0"), val = tensor(false)]; tensor transpose_66_perm_0 = const()[name = tensor("transpose_66_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_67_perm_0 = const()[name = tensor("transpose_67_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_67 = transpose(perm = transpose_67_perm_0, x = k_1_cast_fp16)[name = tensor("transpose_217")]; tensor transpose_66 = transpose(perm = transpose_66_perm_0, x = q_1_cast_fp16)[name = tensor("transpose_218")]; tensor var_94_cast_fp16 = matmul(transpose_x = var_94_transpose_x_0, transpose_y = var_94_transpose_y_0, x = transpose_66, y = transpose_67)[name = tensor("op_94_cast_fp16")]; tensor var_95_to_fp16 = const()[name = tensor("op_95_to_fp16"), val = tensor(0x1p-3)]; tensor attn_1_cast_fp16 = mul(x = var_94_cast_fp16, y = var_95_to_fp16)[name = tensor("attn_1_cast_fp16")]; tensor attn_1_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("attn_1_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor var_102 = const()[name = tensor("op_102"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3714368)))]; tensor attn_1_cast_fp16_to_fp32 = cast(dtype = attn_1_cast_fp16_to_fp32_dtype_0, x = attn_1_cast_fp16)[name = tensor("cast_93")]; tensor input_5 = add(x = attn_1_cast_fp16_to_fp32, y = var_102)[name = tensor("input_5")]; tensor input_5_to_fp16_dtype_0 = const()[name = tensor("input_5_to_fp16_dtype_0"), val = tensor("fp16")]; tensor input_5_to_fp16 = cast(dtype = input_5_to_fp16_dtype_0, x = input_5)[name = tensor("cast_92")]; tensor attn_3_cast_fp16 = softmax(axis = var_54, x = input_5_to_fp16)[name = tensor("attn_3_cast_fp16")]; tensor out_1_transpose_x_0 = const()[name = tensor("out_1_transpose_x_0"), val = tensor(false)]; tensor out_1_transpose_y_0 = const()[name = tensor("out_1_transpose_y_0"), val = tensor(false)]; tensor v_t_1_cast_fp16 = transpose(perm = v_t_1_perm_0, x = v_1_cast_fp16)[name = tensor("transpose_219")]; tensor out_1_cast_fp16 = matmul(transpose_x = out_1_transpose_x_0, transpose_y = out_1_transpose_y_0, x = attn_3_cast_fp16, y = v_t_1_cast_fp16)[name = tensor("out_1_cast_fp16")]; tensor var_106_perm_0 = const()[name = tensor("op_106_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_107 = const()[name = tensor("op_107"), val = tensor([1, 110, -1])]; tensor var_106_cast_fp16 = transpose(perm = var_106_perm_0, x = out_1_cast_fp16)[name = tensor("transpose_216")]; tensor input_7_cast_fp16 = reshape(shape = var_107, x = var_106_cast_fp16)[name = tensor("input_7_cast_fp16")]; tensor layers_0_self_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_0_self_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3762880)))]; tensor linear_1_bias_0_to_fp16 = const()[name = tensor("linear_1_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4942592)))]; tensor linear_1_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_0_self_attn_o_proj_weight_to_fp16, x = input_7_cast_fp16)[name = tensor("linear_1_cast_fp16")]; tensor input_9_cast_fp16 = add(x = input_3_cast_fp16, y = linear_1_cast_fp16)[name = tensor("input_9_cast_fp16")]; tensor x_3_axes_0 = const()[name = tensor("x_3_axes_0"), val = tensor([-1])]; tensor layers_0_norm_xa_query_weight_to_fp16 = const()[name = tensor("layers_0_norm_xa_query_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4944192)))]; tensor x_3_cast_fp16 = layer_norm(axes = x_3_axes_0, epsilon = var_61_to_fp16, gamma = layers_0_norm_xa_query_weight_to_fp16, x = input_9_cast_fp16)[name = tensor("x_3_cast_fp16")]; tensor memory_1_axes_0 = const()[name = tensor("memory_1_axes_0"), val = tensor([-1])]; tensor layers_0_norm_xa_memory_weight_to_fp16 = const()[name = tensor("layers_0_norm_xa_memory_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4945792)))]; tensor memory_1_cast_fp16 = layer_norm(axes = memory_1_axes_0, epsilon = var_61_to_fp16, gamma = layers_0_norm_xa_memory_weight_to_fp16, x = encoder_output)[name = tensor("memory_1_cast_fp16")]; tensor layers_0_cross_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_0_cross_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4947392)))]; tensor linear_2_bias_0_to_fp16 = const()[name = tensor("linear_2_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5144064)))]; tensor linear_2_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = layers_0_cross_attn_q_proj_weight_to_fp16, x = x_3_cast_fp16)[name = tensor("linear_2_cast_fp16")]; tensor var_130 = const()[name = tensor("op_130"), val = tensor([1, 110, 1, 128])]; tensor var_131_cast_fp16 = reshape(shape = var_130, x = linear_2_cast_fp16)[name = tensor("op_131_cast_fp16")]; tensor layers_0_cross_attn_kv_proj_weight_to_fp16 = const()[name = tensor("layers_0_cross_attn_kv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5144384)))]; tensor linear_3_bias_0_to_fp16 = const()[name = tensor("linear_3_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5537664)))]; tensor linear_3_cast_fp16 = linear(bias = linear_3_bias_0_to_fp16, weight = layers_0_cross_attn_kv_proj_weight_to_fp16, x = memory_1_cast_fp16)[name = tensor("linear_3_cast_fp16")]; tensor var_135 = const()[name = tensor("op_135"), val = tensor([1, 256, 2, 1, 128])]; tensor kv_1_cast_fp16 = reshape(shape = var_135, x = linear_3_cast_fp16)[name = tensor("kv_1_cast_fp16")]; tensor var_139_begin_0 = const()[name = tensor("op_139_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_139_end_0 = const()[name = tensor("op_139_end_0"), val = tensor([1, 256, 1, 1, 128])]; tensor var_139_end_mask_0 = const()[name = tensor("op_139_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_139_squeeze_mask_0 = const()[name = tensor("op_139_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_139_cast_fp16 = slice_by_index(begin = var_139_begin_0, end = var_139_end_0, end_mask = var_139_end_mask_0, squeeze_mask = var_139_squeeze_mask_0, x = kv_1_cast_fp16)[name = tensor("op_139_cast_fp16")]; tensor var_143_begin_0 = const()[name = tensor("op_143_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor var_143_end_0 = const()[name = tensor("op_143_end_0"), val = tensor([1, 256, 2, 1, 128])]; tensor var_143_end_mask_0 = const()[name = tensor("op_143_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_143_squeeze_mask_0 = const()[name = tensor("op_143_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_143_cast_fp16 = slice_by_index(begin = var_143_begin_0, end = var_143_end_0, end_mask = var_143_end_mask_0, squeeze_mask = var_143_squeeze_mask_0, x = kv_1_cast_fp16)[name = tensor("op_143_cast_fp16")]; tensor v_3_perm_0 = const()[name = tensor("v_3_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_146_transpose_x_0 = const()[name = tensor("op_146_transpose_x_0"), val = tensor(false)]; tensor var_146_transpose_y_0 = const()[name = tensor("op_146_transpose_y_0"), val = tensor(false)]; tensor transpose_68_perm_0 = const()[name = tensor("transpose_68_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_69_perm_0 = const()[name = tensor("transpose_69_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_69 = transpose(perm = transpose_69_perm_0, x = var_139_cast_fp16)[name = tensor("transpose_213")]; tensor transpose_68 = transpose(perm = transpose_68_perm_0, x = var_131_cast_fp16)[name = tensor("transpose_214")]; tensor var_146_cast_fp16 = matmul(transpose_x = var_146_transpose_x_0, transpose_y = var_146_transpose_y_0, x = transpose_68, y = transpose_69)[name = tensor("op_146_cast_fp16")]; tensor var_147_to_fp16 = const()[name = tensor("op_147_to_fp16"), val = tensor(0x1.6ap-4)]; tensor attn_5_cast_fp16 = mul(x = var_146_cast_fp16, y = var_147_to_fp16)[name = tensor("attn_5_cast_fp16")]; tensor var_149_axes_0 = const()[name = tensor("op_149_axes_0"), val = tensor([1])]; tensor var_149 = expand_dims(axes = var_149_axes_0, x = cast_94)[name = tensor("op_149")]; tensor attn_mask_1_axes_0 = const()[name = tensor("attn_mask_1_axes_0"), val = tensor([2])]; tensor attn_mask_1 = expand_dims(axes = attn_mask_1_axes_0, x = var_149)[name = tensor("attn_mask_1")]; tensor var_151 = logical_not(x = attn_mask_1)[name = tensor("op_151")]; tensor var_45_to_fp16 = const()[name = tensor("op_45_to_fp16"), val = tensor(-inf)]; tensor input_11_cast_fp16 = select(a = var_45_to_fp16, b = attn_5_cast_fp16, cond = var_151)[name = tensor("input_11_cast_fp16")]; tensor attn_7_cast_fp16 = softmax(axis = var_54, x = input_11_cast_fp16)[name = tensor("attn_7_cast_fp16")]; tensor out_3_transpose_x_0 = const()[name = tensor("out_3_transpose_x_0"), val = tensor(false)]; tensor out_3_transpose_y_0 = const()[name = tensor("out_3_transpose_y_0"), val = tensor(false)]; tensor v_3_cast_fp16 = transpose(perm = v_3_perm_0, x = var_143_cast_fp16)[name = tensor("transpose_215")]; tensor out_3_cast_fp16 = matmul(transpose_x = out_3_transpose_x_0, transpose_y = out_3_transpose_y_0, x = attn_7_cast_fp16, y = v_3_cast_fp16)[name = tensor("out_3_cast_fp16")]; tensor var_155_perm_0 = const()[name = tensor("op_155_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_156 = const()[name = tensor("op_156"), val = tensor([1, 110, -1])]; tensor var_155_cast_fp16 = transpose(perm = var_155_perm_0, x = out_3_cast_fp16)[name = tensor("transpose_212")]; tensor input_13_cast_fp16 = reshape(shape = var_156, x = var_155_cast_fp16)[name = tensor("input_13_cast_fp16")]; tensor layers_0_cross_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_0_cross_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5538240)))]; tensor linear_4_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_0_cross_attn_o_proj_weight_to_fp16, x = input_13_cast_fp16)[name = tensor("linear_4_cast_fp16")]; tensor input_15_cast_fp16 = add(x = input_9_cast_fp16, y = linear_4_cast_fp16)[name = tensor("input_15_cast_fp16")]; tensor x_5_axes_0 = const()[name = tensor("x_5_axes_0"), val = tensor([-1])]; tensor layers_0_norm_ff_weight_to_fp16 = const()[name = tensor("layers_0_norm_ff_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5734912)))]; tensor x_5_cast_fp16 = layer_norm(axes = x_5_axes_0, epsilon = var_61_to_fp16, gamma = layers_0_norm_ff_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("x_5_cast_fp16")]; tensor input_17_perm_0 = const()[name = tensor("input_17_perm_0"), val = tensor([0, 2, 1])]; tensor input_19_pad_type_0 = const()[name = tensor("input_19_pad_type_0"), val = tensor("valid")]; tensor input_19_strides_0 = const()[name = tensor("input_19_strides_0"), val = tensor([1])]; tensor input_19_pad_0 = const()[name = tensor("input_19_pad_0"), val = tensor([0, 0])]; tensor input_19_dilations_0 = const()[name = tensor("input_19_dilations_0"), val = tensor([1])]; tensor input_19_groups_0 = const()[name = tensor("input_19_groups_0"), val = tensor(1)]; tensor layers_0_ffn_conv1_weight_to_fp16 = const()[name = tensor("layers_0_ffn_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5736512)))]; tensor input_17_cast_fp16 = transpose(perm = input_17_perm_0, x = x_5_cast_fp16)[name = tensor("transpose_211")]; tensor input_19_cast_fp16 = conv(dilations = input_19_dilations_0, groups = input_19_groups_0, pad = input_19_pad_0, pad_type = input_19_pad_type_0, strides = input_19_strides_0, weight = layers_0_ffn_conv1_weight_to_fp16, x = input_17_cast_fp16)[name = tensor("input_19_cast_fp16")]; tensor input_21_mode_0 = const()[name = tensor("input_21_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor input_21_cast_fp16 = gelu(mode = input_21_mode_0, x = input_19_cast_fp16)[name = tensor("input_21_cast_fp16")]; tensor x_7_pad_type_0 = const()[name = tensor("x_7_pad_type_0"), val = tensor("valid")]; tensor x_7_strides_0 = const()[name = tensor("x_7_strides_0"), val = tensor([1])]; tensor x_7_pad_0 = const()[name = tensor("x_7_pad_0"), val = tensor([0, 0])]; tensor x_7_dilations_0 = const()[name = tensor("x_7_dilations_0"), val = tensor([1])]; tensor x_7_groups_0 = const()[name = tensor("x_7_groups_0"), val = tensor(1)]; tensor layers_0_ffn_conv2_weight_to_fp16 = const()[name = tensor("layers_0_ffn_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10455168)))]; tensor x_7_cast_fp16 = conv(dilations = x_7_dilations_0, groups = x_7_groups_0, pad = x_7_pad_0, pad_type = x_7_pad_type_0, strides = x_7_strides_0, weight = layers_0_ffn_conv2_weight_to_fp16, x = input_21_cast_fp16)[name = tensor("x_7_cast_fp16")]; tensor x_9_perm_0 = const()[name = tensor("x_9_perm_0"), val = tensor([0, 2, 1])]; tensor x_9_cast_fp16 = transpose(perm = x_9_perm_0, x = x_7_cast_fp16)[name = tensor("transpose_210")]; tensor input_23_cast_fp16 = add(x = input_15_cast_fp16, y = x_9_cast_fp16)[name = tensor("input_23_cast_fp16")]; tensor k_padded_1_pad_0 = const()[name = tensor("k_padded_1_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor k_padded_1_mode_0 = const()[name = tensor("k_padded_1_mode_0"), val = tensor("constant")]; tensor const_7_to_fp16 = const()[name = tensor("const_7_to_fp16"), val = tensor(0x0p+0)]; tensor k_padded_1_cast_fp16 = pad(constant_val = const_7_to_fp16, mode = k_padded_1_mode_0, pad = k_padded_1_pad_0, x = k_1_cast_fp16)[name = tensor("k_padded_1_cast_fp16")]; tensor v_padded_1_pad_0 = const()[name = tensor("v_padded_1_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor v_padded_1_mode_0 = const()[name = tensor("v_padded_1_mode_0"), val = tensor("constant")]; tensor const_8_to_fp16 = const()[name = tensor("const_8_to_fp16"), val = tensor(0x0p+0)]; tensor v_padded_1_cast_fp16 = pad(constant_val = const_8_to_fp16, mode = v_padded_1_mode_0, pad = v_padded_1_pad_0, x = v_1_cast_fp16)[name = tensor("v_padded_1_cast_fp16")]; tensor var_208_axis_0 = const()[name = tensor("op_208_axis_0"), val = tensor(0)]; tensor var_208 = stack(axis = var_208_axis_0, values = (k_padded_1_cast_fp16, v_padded_1_cast_fp16))[name = tensor("op_208_cast_fp16")]; tensor var_220 = const()[name = tensor("op_220"), val = tensor(-1)]; tensor x_11_axes_0 = const()[name = tensor("x_11_axes_0"), val = tensor([-1])]; tensor layers_1_norm_sa_weight_to_fp16 = const()[name = tensor("layers_1_norm_sa_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15173824)))]; tensor var_227_to_fp16 = const()[name = tensor("op_227_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_11_cast_fp16 = layer_norm(axes = x_11_axes_0, epsilon = var_227_to_fp16, gamma = layers_1_norm_sa_weight_to_fp16, x = input_23_cast_fp16)[name = tensor("x_11_cast_fp16")]; tensor layers_1_self_attn_qkv_proj_weight_to_fp16 = const()[name = tensor("layers_1_self_attn_qkv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15175424)))]; tensor linear_5_cast_fp16 = linear(bias = linear_0_bias_0_to_fp16, weight = layers_1_self_attn_qkv_proj_weight_to_fp16, x = x_11_cast_fp16)[name = tensor("linear_5_cast_fp16")]; tensor var_245 = const()[name = tensor("op_245"), val = tensor([1, 110, 3, 12, 64])]; tensor qkv_3_cast_fp16 = reshape(shape = var_245, x = linear_5_cast_fp16)[name = tensor("qkv_3_cast_fp16")]; tensor q_7_begin_0 = const()[name = tensor("q_7_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_7_end_0 = const()[name = tensor("q_7_end_0"), val = tensor([1, 110, 1, 12, 64])]; tensor q_7_end_mask_0 = const()[name = tensor("q_7_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_7_squeeze_mask_0 = const()[name = tensor("q_7_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_7_cast_fp16 = slice_by_index(begin = q_7_begin_0, end = q_7_end_0, end_mask = q_7_end_mask_0, squeeze_mask = q_7_squeeze_mask_0, x = qkv_3_cast_fp16)[name = tensor("q_7_cast_fp16")]; tensor k_5_begin_0 = const()[name = tensor("k_5_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_5_end_0 = const()[name = tensor("k_5_end_0"), val = tensor([1, 110, 2, 12, 64])]; tensor k_5_end_mask_0 = const()[name = tensor("k_5_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_5_squeeze_mask_0 = const()[name = tensor("k_5_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_5_cast_fp16 = slice_by_index(begin = k_5_begin_0, end = k_5_end_0, end_mask = k_5_end_mask_0, squeeze_mask = k_5_squeeze_mask_0, x = qkv_3_cast_fp16)[name = tensor("k_5_cast_fp16")]; tensor v_5_begin_0 = const()[name = tensor("v_5_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_5_end_0 = const()[name = tensor("v_5_end_0"), val = tensor([1, 110, 3, 12, 64])]; tensor v_5_end_mask_0 = const()[name = tensor("v_5_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_5_squeeze_mask_0 = const()[name = tensor("v_5_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_5_cast_fp16 = slice_by_index(begin = v_5_begin_0, end = v_5_end_0, end_mask = v_5_end_mask_0, squeeze_mask = v_5_squeeze_mask_0, x = qkv_3_cast_fp16)[name = tensor("v_5_cast_fp16")]; tensor v_t_3_perm_0 = const()[name = tensor("v_t_3_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_260_transpose_x_0 = const()[name = tensor("op_260_transpose_x_0"), val = tensor(false)]; tensor var_260_transpose_y_0 = const()[name = tensor("op_260_transpose_y_0"), val = tensor(false)]; tensor transpose_70_perm_0 = const()[name = tensor("transpose_70_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_71_perm_0 = const()[name = tensor("transpose_71_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_71 = transpose(perm = transpose_71_perm_0, x = k_5_cast_fp16)[name = tensor("transpose_207")]; tensor transpose_70 = transpose(perm = transpose_70_perm_0, x = q_7_cast_fp16)[name = tensor("transpose_208")]; tensor var_260_cast_fp16 = matmul(transpose_x = var_260_transpose_x_0, transpose_y = var_260_transpose_y_0, x = transpose_70, y = transpose_71)[name = tensor("op_260_cast_fp16")]; tensor var_261_to_fp16 = const()[name = tensor("op_261_to_fp16"), val = tensor(0x1p-3)]; tensor attn_9_cast_fp16 = mul(x = var_260_cast_fp16, y = var_261_to_fp16)[name = tensor("attn_9_cast_fp16")]; tensor attn_9_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("attn_9_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor attn_9_cast_fp16_to_fp32 = cast(dtype = attn_9_cast_fp16_to_fp32_dtype_0, x = attn_9_cast_fp16)[name = tensor("cast_91")]; tensor input_25 = add(x = attn_9_cast_fp16_to_fp32, y = var_102)[name = tensor("input_25")]; tensor input_25_to_fp16_dtype_0 = const()[name = tensor("input_25_to_fp16_dtype_0"), val = tensor("fp16")]; tensor input_25_to_fp16 = cast(dtype = input_25_to_fp16_dtype_0, x = input_25)[name = tensor("cast_90")]; tensor attn_11_cast_fp16 = softmax(axis = var_220, x = input_25_to_fp16)[name = tensor("attn_11_cast_fp16")]; tensor out_5_transpose_x_0 = const()[name = tensor("out_5_transpose_x_0"), val = tensor(false)]; tensor out_5_transpose_y_0 = const()[name = tensor("out_5_transpose_y_0"), val = tensor(false)]; tensor v_t_3_cast_fp16 = transpose(perm = v_t_3_perm_0, x = v_5_cast_fp16)[name = tensor("transpose_209")]; tensor out_5_cast_fp16 = matmul(transpose_x = out_5_transpose_x_0, transpose_y = out_5_transpose_y_0, x = attn_11_cast_fp16, y = v_t_3_cast_fp16)[name = tensor("out_5_cast_fp16")]; tensor var_272_perm_0 = const()[name = tensor("op_272_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_273 = const()[name = tensor("op_273"), val = tensor([1, 110, -1])]; tensor var_272_cast_fp16 = transpose(perm = var_272_perm_0, x = out_5_cast_fp16)[name = tensor("transpose_206")]; tensor input_27_cast_fp16 = reshape(shape = var_273, x = var_272_cast_fp16)[name = tensor("input_27_cast_fp16")]; tensor layers_1_self_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_1_self_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18714432)))]; tensor linear_6_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_1_self_attn_o_proj_weight_to_fp16, x = input_27_cast_fp16)[name = tensor("linear_6_cast_fp16")]; tensor input_29_cast_fp16 = add(x = input_23_cast_fp16, y = linear_6_cast_fp16)[name = tensor("input_29_cast_fp16")]; tensor x_13_axes_0 = const()[name = tensor("x_13_axes_0"), val = tensor([-1])]; tensor layers_1_norm_xa_query_weight_to_fp16 = const()[name = tensor("layers_1_norm_xa_query_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19894144)))]; tensor x_13_cast_fp16 = layer_norm(axes = x_13_axes_0, epsilon = var_227_to_fp16, gamma = layers_1_norm_xa_query_weight_to_fp16, x = input_29_cast_fp16)[name = tensor("x_13_cast_fp16")]; tensor memory_3_axes_0 = const()[name = tensor("memory_3_axes_0"), val = tensor([-1])]; tensor layers_1_norm_xa_memory_weight_to_fp16 = const()[name = tensor("layers_1_norm_xa_memory_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19895744)))]; tensor memory_3_cast_fp16 = layer_norm(axes = memory_3_axes_0, epsilon = var_227_to_fp16, gamma = layers_1_norm_xa_memory_weight_to_fp16, x = encoder_output)[name = tensor("memory_3_cast_fp16")]; tensor layers_1_cross_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_1_cross_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19897344)))]; tensor linear_7_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = layers_1_cross_attn_q_proj_weight_to_fp16, x = x_13_cast_fp16)[name = tensor("linear_7_cast_fp16")]; tensor var_296 = const()[name = tensor("op_296"), val = tensor([1, 110, 1, 128])]; tensor var_297_cast_fp16 = reshape(shape = var_296, x = linear_7_cast_fp16)[name = tensor("op_297_cast_fp16")]; tensor layers_1_cross_attn_kv_proj_weight_to_fp16 = const()[name = tensor("layers_1_cross_attn_kv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20094016)))]; tensor linear_8_cast_fp16 = linear(bias = linear_3_bias_0_to_fp16, weight = layers_1_cross_attn_kv_proj_weight_to_fp16, x = memory_3_cast_fp16)[name = tensor("linear_8_cast_fp16")]; tensor var_301 = const()[name = tensor("op_301"), val = tensor([1, 256, 2, 1, 128])]; tensor kv_3_cast_fp16 = reshape(shape = var_301, x = linear_8_cast_fp16)[name = tensor("kv_3_cast_fp16")]; tensor var_305_begin_0 = const()[name = tensor("op_305_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_305_end_0 = const()[name = tensor("op_305_end_0"), val = tensor([1, 256, 1, 1, 128])]; tensor var_305_end_mask_0 = const()[name = tensor("op_305_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_305_squeeze_mask_0 = const()[name = tensor("op_305_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_305_cast_fp16 = slice_by_index(begin = var_305_begin_0, end = var_305_end_0, end_mask = var_305_end_mask_0, squeeze_mask = var_305_squeeze_mask_0, x = kv_3_cast_fp16)[name = tensor("op_305_cast_fp16")]; tensor var_309_begin_0 = const()[name = tensor("op_309_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor var_309_end_0 = const()[name = tensor("op_309_end_0"), val = tensor([1, 256, 2, 1, 128])]; tensor var_309_end_mask_0 = const()[name = tensor("op_309_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_309_squeeze_mask_0 = const()[name = tensor("op_309_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_309_cast_fp16 = slice_by_index(begin = var_309_begin_0, end = var_309_end_0, end_mask = var_309_end_mask_0, squeeze_mask = var_309_squeeze_mask_0, x = kv_3_cast_fp16)[name = tensor("op_309_cast_fp16")]; tensor v_7_perm_0 = const()[name = tensor("v_7_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_312_transpose_x_0 = const()[name = tensor("op_312_transpose_x_0"), val = tensor(false)]; tensor var_312_transpose_y_0 = const()[name = tensor("op_312_transpose_y_0"), val = tensor(false)]; tensor transpose_72_perm_0 = const()[name = tensor("transpose_72_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_73_perm_0 = const()[name = tensor("transpose_73_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_73 = transpose(perm = transpose_73_perm_0, x = var_305_cast_fp16)[name = tensor("transpose_203")]; tensor transpose_72 = transpose(perm = transpose_72_perm_0, x = var_297_cast_fp16)[name = tensor("transpose_204")]; tensor var_312_cast_fp16 = matmul(transpose_x = var_312_transpose_x_0, transpose_y = var_312_transpose_y_0, x = transpose_72, y = transpose_73)[name = tensor("op_312_cast_fp16")]; tensor var_313_to_fp16 = const()[name = tensor("op_313_to_fp16"), val = tensor(0x1.6ap-4)]; tensor attn_13_cast_fp16 = mul(x = var_312_cast_fp16, y = var_313_to_fp16)[name = tensor("attn_13_cast_fp16")]; tensor var_211_to_fp16 = const()[name = tensor("op_211_to_fp16"), val = tensor(-inf)]; tensor input_31_cast_fp16 = select(a = var_211_to_fp16, b = attn_13_cast_fp16, cond = var_151)[name = tensor("input_31_cast_fp16")]; tensor attn_15_cast_fp16 = softmax(axis = var_220, x = input_31_cast_fp16)[name = tensor("attn_15_cast_fp16")]; tensor out_7_transpose_x_0 = const()[name = tensor("out_7_transpose_x_0"), val = tensor(false)]; tensor out_7_transpose_y_0 = const()[name = tensor("out_7_transpose_y_0"), val = tensor(false)]; tensor v_7_cast_fp16 = transpose(perm = v_7_perm_0, x = var_309_cast_fp16)[name = tensor("transpose_205")]; tensor out_7_cast_fp16 = matmul(transpose_x = out_7_transpose_x_0, transpose_y = out_7_transpose_y_0, x = attn_15_cast_fp16, y = v_7_cast_fp16)[name = tensor("out_7_cast_fp16")]; tensor var_321_perm_0 = const()[name = tensor("op_321_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_322 = const()[name = tensor("op_322"), val = tensor([1, 110, -1])]; tensor var_321_cast_fp16 = transpose(perm = var_321_perm_0, x = out_7_cast_fp16)[name = tensor("transpose_202")]; tensor input_33_cast_fp16 = reshape(shape = var_322, x = var_321_cast_fp16)[name = tensor("input_33_cast_fp16")]; tensor layers_1_cross_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_1_cross_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20487296)))]; tensor linear_9_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_1_cross_attn_o_proj_weight_to_fp16, x = input_33_cast_fp16)[name = tensor("linear_9_cast_fp16")]; tensor input_35_cast_fp16 = add(x = input_29_cast_fp16, y = linear_9_cast_fp16)[name = tensor("input_35_cast_fp16")]; tensor x_15_axes_0 = const()[name = tensor("x_15_axes_0"), val = tensor([-1])]; tensor layers_1_norm_ff_weight_to_fp16 = const()[name = tensor("layers_1_norm_ff_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20683968)))]; tensor x_15_cast_fp16 = layer_norm(axes = x_15_axes_0, epsilon = var_227_to_fp16, gamma = layers_1_norm_ff_weight_to_fp16, x = input_35_cast_fp16)[name = tensor("x_15_cast_fp16")]; tensor input_37_perm_0 = const()[name = tensor("input_37_perm_0"), val = tensor([0, 2, 1])]; tensor input_39_pad_type_0 = const()[name = tensor("input_39_pad_type_0"), val = tensor("valid")]; tensor input_39_strides_0 = const()[name = tensor("input_39_strides_0"), val = tensor([1])]; tensor input_39_pad_0 = const()[name = tensor("input_39_pad_0"), val = tensor([0, 0])]; tensor input_39_dilations_0 = const()[name = tensor("input_39_dilations_0"), val = tensor([1])]; tensor input_39_groups_0 = const()[name = tensor("input_39_groups_0"), val = tensor(1)]; tensor layers_1_ffn_conv1_weight_to_fp16 = const()[name = tensor("layers_1_ffn_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20685568)))]; tensor input_37_cast_fp16 = transpose(perm = input_37_perm_0, x = x_15_cast_fp16)[name = tensor("transpose_201")]; tensor input_39_cast_fp16 = conv(dilations = input_39_dilations_0, groups = input_39_groups_0, pad = input_39_pad_0, pad_type = input_39_pad_type_0, strides = input_39_strides_0, weight = layers_1_ffn_conv1_weight_to_fp16, x = input_37_cast_fp16)[name = tensor("input_39_cast_fp16")]; tensor input_41_mode_0 = const()[name = tensor("input_41_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor input_41_cast_fp16 = gelu(mode = input_41_mode_0, x = input_39_cast_fp16)[name = tensor("input_41_cast_fp16")]; tensor x_17_pad_type_0 = const()[name = tensor("x_17_pad_type_0"), val = tensor("valid")]; tensor x_17_strides_0 = const()[name = tensor("x_17_strides_0"), val = tensor([1])]; tensor x_17_pad_0 = const()[name = tensor("x_17_pad_0"), val = tensor([0, 0])]; tensor x_17_dilations_0 = const()[name = tensor("x_17_dilations_0"), val = tensor([1])]; tensor x_17_groups_0 = const()[name = tensor("x_17_groups_0"), val = tensor(1)]; tensor layers_1_ffn_conv2_weight_to_fp16 = const()[name = tensor("layers_1_ffn_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25404224)))]; tensor x_17_cast_fp16 = conv(dilations = x_17_dilations_0, groups = x_17_groups_0, pad = x_17_pad_0, pad_type = x_17_pad_type_0, strides = x_17_strides_0, weight = layers_1_ffn_conv2_weight_to_fp16, x = input_41_cast_fp16)[name = tensor("x_17_cast_fp16")]; tensor x_19_perm_0 = const()[name = tensor("x_19_perm_0"), val = tensor([0, 2, 1])]; tensor x_19_cast_fp16 = transpose(perm = x_19_perm_0, x = x_17_cast_fp16)[name = tensor("transpose_200")]; tensor input_43_cast_fp16 = add(x = input_35_cast_fp16, y = x_19_cast_fp16)[name = tensor("input_43_cast_fp16")]; tensor k_padded_3_pad_0 = const()[name = tensor("k_padded_3_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor k_padded_3_mode_0 = const()[name = tensor("k_padded_3_mode_0"), val = tensor("constant")]; tensor const_14_to_fp16 = const()[name = tensor("const_14_to_fp16"), val = tensor(0x0p+0)]; tensor k_padded_3_cast_fp16 = pad(constant_val = const_14_to_fp16, mode = k_padded_3_mode_0, pad = k_padded_3_pad_0, x = k_5_cast_fp16)[name = tensor("k_padded_3_cast_fp16")]; tensor v_padded_3_pad_0 = const()[name = tensor("v_padded_3_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor v_padded_3_mode_0 = const()[name = tensor("v_padded_3_mode_0"), val = tensor("constant")]; tensor const_15_to_fp16 = const()[name = tensor("const_15_to_fp16"), val = tensor(0x0p+0)]; tensor v_padded_3_cast_fp16 = pad(constant_val = const_15_to_fp16, mode = v_padded_3_mode_0, pad = v_padded_3_pad_0, x = v_5_cast_fp16)[name = tensor("v_padded_3_cast_fp16")]; tensor var_374_axis_0 = const()[name = tensor("op_374_axis_0"), val = tensor(0)]; tensor var_374 = stack(axis = var_374_axis_0, values = (k_padded_3_cast_fp16, v_padded_3_cast_fp16))[name = tensor("op_374_cast_fp16")]; tensor var_386 = const()[name = tensor("op_386"), val = tensor(-1)]; tensor x_21_axes_0 = const()[name = tensor("x_21_axes_0"), val = tensor([-1])]; tensor layers_2_norm_sa_weight_to_fp16 = const()[name = tensor("layers_2_norm_sa_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30122880)))]; tensor var_393_to_fp16 = const()[name = tensor("op_393_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_21_cast_fp16 = layer_norm(axes = x_21_axes_0, epsilon = var_393_to_fp16, gamma = layers_2_norm_sa_weight_to_fp16, x = input_43_cast_fp16)[name = tensor("x_21_cast_fp16")]; tensor layers_2_self_attn_qkv_proj_weight_to_fp16 = const()[name = tensor("layers_2_self_attn_qkv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30124480)))]; tensor linear_10_cast_fp16 = linear(bias = linear_0_bias_0_to_fp16, weight = layers_2_self_attn_qkv_proj_weight_to_fp16, x = x_21_cast_fp16)[name = tensor("linear_10_cast_fp16")]; tensor var_411 = const()[name = tensor("op_411"), val = tensor([1, 110, 3, 12, 64])]; tensor qkv_5_cast_fp16 = reshape(shape = var_411, x = linear_10_cast_fp16)[name = tensor("qkv_5_cast_fp16")]; tensor q_13_begin_0 = const()[name = tensor("q_13_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_13_end_0 = const()[name = tensor("q_13_end_0"), val = tensor([1, 110, 1, 12, 64])]; tensor q_13_end_mask_0 = const()[name = tensor("q_13_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_13_squeeze_mask_0 = const()[name = tensor("q_13_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_13_cast_fp16 = slice_by_index(begin = q_13_begin_0, end = q_13_end_0, end_mask = q_13_end_mask_0, squeeze_mask = q_13_squeeze_mask_0, x = qkv_5_cast_fp16)[name = tensor("q_13_cast_fp16")]; tensor k_9_begin_0 = const()[name = tensor("k_9_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_9_end_0 = const()[name = tensor("k_9_end_0"), val = tensor([1, 110, 2, 12, 64])]; tensor k_9_end_mask_0 = const()[name = tensor("k_9_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_9_squeeze_mask_0 = const()[name = tensor("k_9_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_9_cast_fp16 = slice_by_index(begin = k_9_begin_0, end = k_9_end_0, end_mask = k_9_end_mask_0, squeeze_mask = k_9_squeeze_mask_0, x = qkv_5_cast_fp16)[name = tensor("k_9_cast_fp16")]; tensor v_9_begin_0 = const()[name = tensor("v_9_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_9_end_0 = const()[name = tensor("v_9_end_0"), val = tensor([1, 110, 3, 12, 64])]; tensor v_9_end_mask_0 = const()[name = tensor("v_9_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_9_squeeze_mask_0 = const()[name = tensor("v_9_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_9_cast_fp16 = slice_by_index(begin = v_9_begin_0, end = v_9_end_0, end_mask = v_9_end_mask_0, squeeze_mask = v_9_squeeze_mask_0, x = qkv_5_cast_fp16)[name = tensor("v_9_cast_fp16")]; tensor v_t_5_perm_0 = const()[name = tensor("v_t_5_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_426_transpose_x_0 = const()[name = tensor("op_426_transpose_x_0"), val = tensor(false)]; tensor var_426_transpose_y_0 = const()[name = tensor("op_426_transpose_y_0"), val = tensor(false)]; tensor transpose_74_perm_0 = const()[name = tensor("transpose_74_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_75_perm_0 = const()[name = tensor("transpose_75_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_75 = transpose(perm = transpose_75_perm_0, x = k_9_cast_fp16)[name = tensor("transpose_197")]; tensor transpose_74 = transpose(perm = transpose_74_perm_0, x = q_13_cast_fp16)[name = tensor("transpose_198")]; tensor var_426_cast_fp16 = matmul(transpose_x = var_426_transpose_x_0, transpose_y = var_426_transpose_y_0, x = transpose_74, y = transpose_75)[name = tensor("op_426_cast_fp16")]; tensor var_427_to_fp16 = const()[name = tensor("op_427_to_fp16"), val = tensor(0x1p-3)]; tensor attn_17_cast_fp16 = mul(x = var_426_cast_fp16, y = var_427_to_fp16)[name = tensor("attn_17_cast_fp16")]; tensor attn_17_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("attn_17_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor attn_17_cast_fp16_to_fp32 = cast(dtype = attn_17_cast_fp16_to_fp32_dtype_0, x = attn_17_cast_fp16)[name = tensor("cast_89")]; tensor input_45 = add(x = attn_17_cast_fp16_to_fp32, y = var_102)[name = tensor("input_45")]; tensor input_45_to_fp16_dtype_0 = const()[name = tensor("input_45_to_fp16_dtype_0"), val = tensor("fp16")]; tensor input_45_to_fp16 = cast(dtype = input_45_to_fp16_dtype_0, x = input_45)[name = tensor("cast_88")]; tensor attn_19_cast_fp16 = softmax(axis = var_386, x = input_45_to_fp16)[name = tensor("attn_19_cast_fp16")]; tensor out_9_transpose_x_0 = const()[name = tensor("out_9_transpose_x_0"), val = tensor(false)]; tensor out_9_transpose_y_0 = const()[name = tensor("out_9_transpose_y_0"), val = tensor(false)]; tensor v_t_5_cast_fp16 = transpose(perm = v_t_5_perm_0, x = v_9_cast_fp16)[name = tensor("transpose_199")]; tensor out_9_cast_fp16 = matmul(transpose_x = out_9_transpose_x_0, transpose_y = out_9_transpose_y_0, x = attn_19_cast_fp16, y = v_t_5_cast_fp16)[name = tensor("out_9_cast_fp16")]; tensor var_438_perm_0 = const()[name = tensor("op_438_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_439 = const()[name = tensor("op_439"), val = tensor([1, 110, -1])]; tensor var_438_cast_fp16 = transpose(perm = var_438_perm_0, x = out_9_cast_fp16)[name = tensor("transpose_196")]; tensor input_47_cast_fp16 = reshape(shape = var_439, x = var_438_cast_fp16)[name = tensor("input_47_cast_fp16")]; tensor layers_2_self_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_2_self_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33663488)))]; tensor linear_11_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_2_self_attn_o_proj_weight_to_fp16, x = input_47_cast_fp16)[name = tensor("linear_11_cast_fp16")]; tensor input_49_cast_fp16 = add(x = input_43_cast_fp16, y = linear_11_cast_fp16)[name = tensor("input_49_cast_fp16")]; tensor x_23_axes_0 = const()[name = tensor("x_23_axes_0"), val = tensor([-1])]; tensor layers_2_norm_xa_query_weight_to_fp16 = const()[name = tensor("layers_2_norm_xa_query_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34843200)))]; tensor x_23_cast_fp16 = layer_norm(axes = x_23_axes_0, epsilon = var_393_to_fp16, gamma = layers_2_norm_xa_query_weight_to_fp16, x = input_49_cast_fp16)[name = tensor("x_23_cast_fp16")]; tensor memory_5_axes_0 = const()[name = tensor("memory_5_axes_0"), val = tensor([-1])]; tensor layers_2_norm_xa_memory_weight_to_fp16 = const()[name = tensor("layers_2_norm_xa_memory_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34844800)))]; tensor memory_5_cast_fp16 = layer_norm(axes = memory_5_axes_0, epsilon = var_393_to_fp16, gamma = layers_2_norm_xa_memory_weight_to_fp16, x = encoder_output)[name = tensor("memory_5_cast_fp16")]; tensor layers_2_cross_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_2_cross_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34846400)))]; tensor linear_12_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = layers_2_cross_attn_q_proj_weight_to_fp16, x = x_23_cast_fp16)[name = tensor("linear_12_cast_fp16")]; tensor var_462 = const()[name = tensor("op_462"), val = tensor([1, 110, 1, 128])]; tensor var_463_cast_fp16 = reshape(shape = var_462, x = linear_12_cast_fp16)[name = tensor("op_463_cast_fp16")]; tensor layers_2_cross_attn_kv_proj_weight_to_fp16 = const()[name = tensor("layers_2_cross_attn_kv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35043072)))]; tensor linear_13_cast_fp16 = linear(bias = linear_3_bias_0_to_fp16, weight = layers_2_cross_attn_kv_proj_weight_to_fp16, x = memory_5_cast_fp16)[name = tensor("linear_13_cast_fp16")]; tensor var_467 = const()[name = tensor("op_467"), val = tensor([1, 256, 2, 1, 128])]; tensor kv_5_cast_fp16 = reshape(shape = var_467, x = linear_13_cast_fp16)[name = tensor("kv_5_cast_fp16")]; tensor var_471_begin_0 = const()[name = tensor("op_471_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_471_end_0 = const()[name = tensor("op_471_end_0"), val = tensor([1, 256, 1, 1, 128])]; tensor var_471_end_mask_0 = const()[name = tensor("op_471_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_471_squeeze_mask_0 = const()[name = tensor("op_471_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_471_cast_fp16 = slice_by_index(begin = var_471_begin_0, end = var_471_end_0, end_mask = var_471_end_mask_0, squeeze_mask = var_471_squeeze_mask_0, x = kv_5_cast_fp16)[name = tensor("op_471_cast_fp16")]; tensor var_475_begin_0 = const()[name = tensor("op_475_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor var_475_end_0 = const()[name = tensor("op_475_end_0"), val = tensor([1, 256, 2, 1, 128])]; tensor var_475_end_mask_0 = const()[name = tensor("op_475_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_475_squeeze_mask_0 = const()[name = tensor("op_475_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_475_cast_fp16 = slice_by_index(begin = var_475_begin_0, end = var_475_end_0, end_mask = var_475_end_mask_0, squeeze_mask = var_475_squeeze_mask_0, x = kv_5_cast_fp16)[name = tensor("op_475_cast_fp16")]; tensor v_11_perm_0 = const()[name = tensor("v_11_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_478_transpose_x_0 = const()[name = tensor("op_478_transpose_x_0"), val = tensor(false)]; tensor var_478_transpose_y_0 = const()[name = tensor("op_478_transpose_y_0"), val = tensor(false)]; tensor transpose_76_perm_0 = const()[name = tensor("transpose_76_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_77_perm_0 = const()[name = tensor("transpose_77_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_77 = transpose(perm = transpose_77_perm_0, x = var_471_cast_fp16)[name = tensor("transpose_193")]; tensor transpose_76 = transpose(perm = transpose_76_perm_0, x = var_463_cast_fp16)[name = tensor("transpose_194")]; tensor var_478_cast_fp16 = matmul(transpose_x = var_478_transpose_x_0, transpose_y = var_478_transpose_y_0, x = transpose_76, y = transpose_77)[name = tensor("op_478_cast_fp16")]; tensor var_479_to_fp16 = const()[name = tensor("op_479_to_fp16"), val = tensor(0x1.6ap-4)]; tensor attn_21_cast_fp16 = mul(x = var_478_cast_fp16, y = var_479_to_fp16)[name = tensor("attn_21_cast_fp16")]; tensor var_377_to_fp16 = const()[name = tensor("op_377_to_fp16"), val = tensor(-inf)]; tensor input_51_cast_fp16 = select(a = var_377_to_fp16, b = attn_21_cast_fp16, cond = var_151)[name = tensor("input_51_cast_fp16")]; tensor attn_23_cast_fp16 = softmax(axis = var_386, x = input_51_cast_fp16)[name = tensor("attn_23_cast_fp16")]; tensor out_11_transpose_x_0 = const()[name = tensor("out_11_transpose_x_0"), val = tensor(false)]; tensor out_11_transpose_y_0 = const()[name = tensor("out_11_transpose_y_0"), val = tensor(false)]; tensor v_11_cast_fp16 = transpose(perm = v_11_perm_0, x = var_475_cast_fp16)[name = tensor("transpose_195")]; tensor out_11_cast_fp16 = matmul(transpose_x = out_11_transpose_x_0, transpose_y = out_11_transpose_y_0, x = attn_23_cast_fp16, y = v_11_cast_fp16)[name = tensor("out_11_cast_fp16")]; tensor var_487_perm_0 = const()[name = tensor("op_487_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_488 = const()[name = tensor("op_488"), val = tensor([1, 110, -1])]; tensor var_487_cast_fp16 = transpose(perm = var_487_perm_0, x = out_11_cast_fp16)[name = tensor("transpose_192")]; tensor input_53_cast_fp16 = reshape(shape = var_488, x = var_487_cast_fp16)[name = tensor("input_53_cast_fp16")]; tensor layers_2_cross_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_2_cross_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35436352)))]; tensor linear_14_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_2_cross_attn_o_proj_weight_to_fp16, x = input_53_cast_fp16)[name = tensor("linear_14_cast_fp16")]; tensor input_55_cast_fp16 = add(x = input_49_cast_fp16, y = linear_14_cast_fp16)[name = tensor("input_55_cast_fp16")]; tensor x_25_axes_0 = const()[name = tensor("x_25_axes_0"), val = tensor([-1])]; tensor layers_2_norm_ff_weight_to_fp16 = const()[name = tensor("layers_2_norm_ff_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35633024)))]; tensor x_25_cast_fp16 = layer_norm(axes = x_25_axes_0, epsilon = var_393_to_fp16, gamma = layers_2_norm_ff_weight_to_fp16, x = input_55_cast_fp16)[name = tensor("x_25_cast_fp16")]; tensor input_57_perm_0 = const()[name = tensor("input_57_perm_0"), val = tensor([0, 2, 1])]; tensor input_59_pad_type_0 = const()[name = tensor("input_59_pad_type_0"), val = tensor("valid")]; tensor input_59_strides_0 = const()[name = tensor("input_59_strides_0"), val = tensor([1])]; tensor input_59_pad_0 = const()[name = tensor("input_59_pad_0"), val = tensor([0, 0])]; tensor input_59_dilations_0 = const()[name = tensor("input_59_dilations_0"), val = tensor([1])]; tensor input_59_groups_0 = const()[name = tensor("input_59_groups_0"), val = tensor(1)]; tensor layers_2_ffn_conv1_weight_to_fp16 = const()[name = tensor("layers_2_ffn_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35634624)))]; tensor input_57_cast_fp16 = transpose(perm = input_57_perm_0, x = x_25_cast_fp16)[name = tensor("transpose_191")]; tensor input_59_cast_fp16 = conv(dilations = input_59_dilations_0, groups = input_59_groups_0, pad = input_59_pad_0, pad_type = input_59_pad_type_0, strides = input_59_strides_0, weight = layers_2_ffn_conv1_weight_to_fp16, x = input_57_cast_fp16)[name = tensor("input_59_cast_fp16")]; tensor input_61_mode_0 = const()[name = tensor("input_61_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor input_61_cast_fp16 = gelu(mode = input_61_mode_0, x = input_59_cast_fp16)[name = tensor("input_61_cast_fp16")]; tensor x_27_pad_type_0 = const()[name = tensor("x_27_pad_type_0"), val = tensor("valid")]; tensor x_27_strides_0 = const()[name = tensor("x_27_strides_0"), val = tensor([1])]; tensor x_27_pad_0 = const()[name = tensor("x_27_pad_0"), val = tensor([0, 0])]; tensor x_27_dilations_0 = const()[name = tensor("x_27_dilations_0"), val = tensor([1])]; tensor x_27_groups_0 = const()[name = tensor("x_27_groups_0"), val = tensor(1)]; tensor layers_2_ffn_conv2_weight_to_fp16 = const()[name = tensor("layers_2_ffn_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40353280)))]; tensor x_27_cast_fp16 = conv(dilations = x_27_dilations_0, groups = x_27_groups_0, pad = x_27_pad_0, pad_type = x_27_pad_type_0, strides = x_27_strides_0, weight = layers_2_ffn_conv2_weight_to_fp16, x = input_61_cast_fp16)[name = tensor("x_27_cast_fp16")]; tensor x_29_perm_0 = const()[name = tensor("x_29_perm_0"), val = tensor([0, 2, 1])]; tensor x_29_cast_fp16 = transpose(perm = x_29_perm_0, x = x_27_cast_fp16)[name = tensor("transpose_190")]; tensor input_63_cast_fp16 = add(x = input_55_cast_fp16, y = x_29_cast_fp16)[name = tensor("input_63_cast_fp16")]; tensor k_padded_5_pad_0 = const()[name = tensor("k_padded_5_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor k_padded_5_mode_0 = const()[name = tensor("k_padded_5_mode_0"), val = tensor("constant")]; tensor const_21_to_fp16 = const()[name = tensor("const_21_to_fp16"), val = tensor(0x0p+0)]; tensor k_padded_5_cast_fp16 = pad(constant_val = const_21_to_fp16, mode = k_padded_5_mode_0, pad = k_padded_5_pad_0, x = k_9_cast_fp16)[name = tensor("k_padded_5_cast_fp16")]; tensor v_padded_5_pad_0 = const()[name = tensor("v_padded_5_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor v_padded_5_mode_0 = const()[name = tensor("v_padded_5_mode_0"), val = tensor("constant")]; tensor const_22_to_fp16 = const()[name = tensor("const_22_to_fp16"), val = tensor(0x0p+0)]; tensor v_padded_5_cast_fp16 = pad(constant_val = const_22_to_fp16, mode = v_padded_5_mode_0, pad = v_padded_5_pad_0, x = v_9_cast_fp16)[name = tensor("v_padded_5_cast_fp16")]; tensor var_540_axis_0 = const()[name = tensor("op_540_axis_0"), val = tensor(0)]; tensor var_540 = stack(axis = var_540_axis_0, values = (k_padded_5_cast_fp16, v_padded_5_cast_fp16))[name = tensor("op_540_cast_fp16")]; tensor var_552 = const()[name = tensor("op_552"), val = tensor(-1)]; tensor x_31_axes_0 = const()[name = tensor("x_31_axes_0"), val = tensor([-1])]; tensor layers_3_norm_sa_weight_to_fp16 = const()[name = tensor("layers_3_norm_sa_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45071936)))]; tensor var_559_to_fp16 = const()[name = tensor("op_559_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_31_cast_fp16 = layer_norm(axes = x_31_axes_0, epsilon = var_559_to_fp16, gamma = layers_3_norm_sa_weight_to_fp16, x = input_63_cast_fp16)[name = tensor("x_31_cast_fp16")]; tensor layers_3_self_attn_qkv_proj_weight_to_fp16 = const()[name = tensor("layers_3_self_attn_qkv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45073536)))]; tensor linear_15_cast_fp16 = linear(bias = linear_0_bias_0_to_fp16, weight = layers_3_self_attn_qkv_proj_weight_to_fp16, x = x_31_cast_fp16)[name = tensor("linear_15_cast_fp16")]; tensor var_577 = const()[name = tensor("op_577"), val = tensor([1, 110, 3, 12, 64])]; tensor qkv_7_cast_fp16 = reshape(shape = var_577, x = linear_15_cast_fp16)[name = tensor("qkv_7_cast_fp16")]; tensor q_19_begin_0 = const()[name = tensor("q_19_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_19_end_0 = const()[name = tensor("q_19_end_0"), val = tensor([1, 110, 1, 12, 64])]; tensor q_19_end_mask_0 = const()[name = tensor("q_19_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_19_squeeze_mask_0 = const()[name = tensor("q_19_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_19_cast_fp16 = slice_by_index(begin = q_19_begin_0, end = q_19_end_0, end_mask = q_19_end_mask_0, squeeze_mask = q_19_squeeze_mask_0, x = qkv_7_cast_fp16)[name = tensor("q_19_cast_fp16")]; tensor k_13_begin_0 = const()[name = tensor("k_13_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_13_end_0 = const()[name = tensor("k_13_end_0"), val = tensor([1, 110, 2, 12, 64])]; tensor k_13_end_mask_0 = const()[name = tensor("k_13_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_13_squeeze_mask_0 = const()[name = tensor("k_13_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_13_cast_fp16 = slice_by_index(begin = k_13_begin_0, end = k_13_end_0, end_mask = k_13_end_mask_0, squeeze_mask = k_13_squeeze_mask_0, x = qkv_7_cast_fp16)[name = tensor("k_13_cast_fp16")]; tensor v_13_begin_0 = const()[name = tensor("v_13_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_13_end_0 = const()[name = tensor("v_13_end_0"), val = tensor([1, 110, 3, 12, 64])]; tensor v_13_end_mask_0 = const()[name = tensor("v_13_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_13_squeeze_mask_0 = const()[name = tensor("v_13_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_13_cast_fp16 = slice_by_index(begin = v_13_begin_0, end = v_13_end_0, end_mask = v_13_end_mask_0, squeeze_mask = v_13_squeeze_mask_0, x = qkv_7_cast_fp16)[name = tensor("v_13_cast_fp16")]; tensor v_t_7_perm_0 = const()[name = tensor("v_t_7_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_592_transpose_x_0 = const()[name = tensor("op_592_transpose_x_0"), val = tensor(false)]; tensor var_592_transpose_y_0 = const()[name = tensor("op_592_transpose_y_0"), val = tensor(false)]; tensor transpose_78_perm_0 = const()[name = tensor("transpose_78_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_79_perm_0 = const()[name = tensor("transpose_79_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_79 = transpose(perm = transpose_79_perm_0, x = k_13_cast_fp16)[name = tensor("transpose_187")]; tensor transpose_78 = transpose(perm = transpose_78_perm_0, x = q_19_cast_fp16)[name = tensor("transpose_188")]; tensor var_592_cast_fp16 = matmul(transpose_x = var_592_transpose_x_0, transpose_y = var_592_transpose_y_0, x = transpose_78, y = transpose_79)[name = tensor("op_592_cast_fp16")]; tensor var_593_to_fp16 = const()[name = tensor("op_593_to_fp16"), val = tensor(0x1p-3)]; tensor attn_25_cast_fp16 = mul(x = var_592_cast_fp16, y = var_593_to_fp16)[name = tensor("attn_25_cast_fp16")]; tensor attn_25_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("attn_25_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor attn_25_cast_fp16_to_fp32 = cast(dtype = attn_25_cast_fp16_to_fp32_dtype_0, x = attn_25_cast_fp16)[name = tensor("cast_87")]; tensor input_65 = add(x = attn_25_cast_fp16_to_fp32, y = var_102)[name = tensor("input_65")]; tensor input_65_to_fp16_dtype_0 = const()[name = tensor("input_65_to_fp16_dtype_0"), val = tensor("fp16")]; tensor input_65_to_fp16 = cast(dtype = input_65_to_fp16_dtype_0, x = input_65)[name = tensor("cast_86")]; tensor attn_27_cast_fp16 = softmax(axis = var_552, x = input_65_to_fp16)[name = tensor("attn_27_cast_fp16")]; tensor out_13_transpose_x_0 = const()[name = tensor("out_13_transpose_x_0"), val = tensor(false)]; tensor out_13_transpose_y_0 = const()[name = tensor("out_13_transpose_y_0"), val = tensor(false)]; tensor v_t_7_cast_fp16 = transpose(perm = v_t_7_perm_0, x = v_13_cast_fp16)[name = tensor("transpose_189")]; tensor out_13_cast_fp16 = matmul(transpose_x = out_13_transpose_x_0, transpose_y = out_13_transpose_y_0, x = attn_27_cast_fp16, y = v_t_7_cast_fp16)[name = tensor("out_13_cast_fp16")]; tensor var_604_perm_0 = const()[name = tensor("op_604_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_605 = const()[name = tensor("op_605"), val = tensor([1, 110, -1])]; tensor var_604_cast_fp16 = transpose(perm = var_604_perm_0, x = out_13_cast_fp16)[name = tensor("transpose_186")]; tensor input_67_cast_fp16 = reshape(shape = var_605, x = var_604_cast_fp16)[name = tensor("input_67_cast_fp16")]; tensor layers_3_self_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_3_self_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(48612544)))]; tensor linear_16_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_3_self_attn_o_proj_weight_to_fp16, x = input_67_cast_fp16)[name = tensor("linear_16_cast_fp16")]; tensor input_69_cast_fp16 = add(x = input_63_cast_fp16, y = linear_16_cast_fp16)[name = tensor("input_69_cast_fp16")]; tensor x_33_axes_0 = const()[name = tensor("x_33_axes_0"), val = tensor([-1])]; tensor layers_3_norm_xa_query_weight_to_fp16 = const()[name = tensor("layers_3_norm_xa_query_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49792256)))]; tensor x_33_cast_fp16 = layer_norm(axes = x_33_axes_0, epsilon = var_559_to_fp16, gamma = layers_3_norm_xa_query_weight_to_fp16, x = input_69_cast_fp16)[name = tensor("x_33_cast_fp16")]; tensor memory_7_axes_0 = const()[name = tensor("memory_7_axes_0"), val = tensor([-1])]; tensor layers_3_norm_xa_memory_weight_to_fp16 = const()[name = tensor("layers_3_norm_xa_memory_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49793856)))]; tensor memory_7_cast_fp16 = layer_norm(axes = memory_7_axes_0, epsilon = var_559_to_fp16, gamma = layers_3_norm_xa_memory_weight_to_fp16, x = encoder_output)[name = tensor("memory_7_cast_fp16")]; tensor layers_3_cross_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_3_cross_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49795456)))]; tensor linear_17_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = layers_3_cross_attn_q_proj_weight_to_fp16, x = x_33_cast_fp16)[name = tensor("linear_17_cast_fp16")]; tensor var_628 = const()[name = tensor("op_628"), val = tensor([1, 110, 1, 128])]; tensor var_629_cast_fp16 = reshape(shape = var_628, x = linear_17_cast_fp16)[name = tensor("op_629_cast_fp16")]; tensor layers_3_cross_attn_kv_proj_weight_to_fp16 = const()[name = tensor("layers_3_cross_attn_kv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49992128)))]; tensor linear_18_cast_fp16 = linear(bias = linear_3_bias_0_to_fp16, weight = layers_3_cross_attn_kv_proj_weight_to_fp16, x = memory_7_cast_fp16)[name = tensor("linear_18_cast_fp16")]; tensor var_633 = const()[name = tensor("op_633"), val = tensor([1, 256, 2, 1, 128])]; tensor kv_7_cast_fp16 = reshape(shape = var_633, x = linear_18_cast_fp16)[name = tensor("kv_7_cast_fp16")]; tensor var_637_begin_0 = const()[name = tensor("op_637_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_637_end_0 = const()[name = tensor("op_637_end_0"), val = tensor([1, 256, 1, 1, 128])]; tensor var_637_end_mask_0 = const()[name = tensor("op_637_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_637_squeeze_mask_0 = const()[name = tensor("op_637_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_637_cast_fp16 = slice_by_index(begin = var_637_begin_0, end = var_637_end_0, end_mask = var_637_end_mask_0, squeeze_mask = var_637_squeeze_mask_0, x = kv_7_cast_fp16)[name = tensor("op_637_cast_fp16")]; tensor var_641_begin_0 = const()[name = tensor("op_641_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor var_641_end_0 = const()[name = tensor("op_641_end_0"), val = tensor([1, 256, 2, 1, 128])]; tensor var_641_end_mask_0 = const()[name = tensor("op_641_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_641_squeeze_mask_0 = const()[name = tensor("op_641_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_641_cast_fp16 = slice_by_index(begin = var_641_begin_0, end = var_641_end_0, end_mask = var_641_end_mask_0, squeeze_mask = var_641_squeeze_mask_0, x = kv_7_cast_fp16)[name = tensor("op_641_cast_fp16")]; tensor v_15_perm_0 = const()[name = tensor("v_15_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_644_transpose_x_0 = const()[name = tensor("op_644_transpose_x_0"), val = tensor(false)]; tensor var_644_transpose_y_0 = const()[name = tensor("op_644_transpose_y_0"), val = tensor(false)]; tensor transpose_80_perm_0 = const()[name = tensor("transpose_80_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_81_perm_0 = const()[name = tensor("transpose_81_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_81 = transpose(perm = transpose_81_perm_0, x = var_637_cast_fp16)[name = tensor("transpose_183")]; tensor transpose_80 = transpose(perm = transpose_80_perm_0, x = var_629_cast_fp16)[name = tensor("transpose_184")]; tensor var_644_cast_fp16 = matmul(transpose_x = var_644_transpose_x_0, transpose_y = var_644_transpose_y_0, x = transpose_80, y = transpose_81)[name = tensor("op_644_cast_fp16")]; tensor var_645_to_fp16 = const()[name = tensor("op_645_to_fp16"), val = tensor(0x1.6ap-4)]; tensor attn_29_cast_fp16 = mul(x = var_644_cast_fp16, y = var_645_to_fp16)[name = tensor("attn_29_cast_fp16")]; tensor var_543_to_fp16 = const()[name = tensor("op_543_to_fp16"), val = tensor(-inf)]; tensor input_71_cast_fp16 = select(a = var_543_to_fp16, b = attn_29_cast_fp16, cond = var_151)[name = tensor("input_71_cast_fp16")]; tensor attn_31_cast_fp16 = softmax(axis = var_552, x = input_71_cast_fp16)[name = tensor("attn_31_cast_fp16")]; tensor out_15_transpose_x_0 = const()[name = tensor("out_15_transpose_x_0"), val = tensor(false)]; tensor out_15_transpose_y_0 = const()[name = tensor("out_15_transpose_y_0"), val = tensor(false)]; tensor v_15_cast_fp16 = transpose(perm = v_15_perm_0, x = var_641_cast_fp16)[name = tensor("transpose_185")]; tensor out_15_cast_fp16 = matmul(transpose_x = out_15_transpose_x_0, transpose_y = out_15_transpose_y_0, x = attn_31_cast_fp16, y = v_15_cast_fp16)[name = tensor("out_15_cast_fp16")]; tensor var_653_perm_0 = const()[name = tensor("op_653_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_654 = const()[name = tensor("op_654"), val = tensor([1, 110, -1])]; tensor var_653_cast_fp16 = transpose(perm = var_653_perm_0, x = out_15_cast_fp16)[name = tensor("transpose_182")]; tensor input_73_cast_fp16 = reshape(shape = var_654, x = var_653_cast_fp16)[name = tensor("input_73_cast_fp16")]; tensor layers_3_cross_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_3_cross_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50385408)))]; tensor linear_19_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_3_cross_attn_o_proj_weight_to_fp16, x = input_73_cast_fp16)[name = tensor("linear_19_cast_fp16")]; tensor input_75_cast_fp16 = add(x = input_69_cast_fp16, y = linear_19_cast_fp16)[name = tensor("input_75_cast_fp16")]; tensor x_35_axes_0 = const()[name = tensor("x_35_axes_0"), val = tensor([-1])]; tensor layers_3_norm_ff_weight_to_fp16 = const()[name = tensor("layers_3_norm_ff_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50582080)))]; tensor x_35_cast_fp16 = layer_norm(axes = x_35_axes_0, epsilon = var_559_to_fp16, gamma = layers_3_norm_ff_weight_to_fp16, x = input_75_cast_fp16)[name = tensor("x_35_cast_fp16")]; tensor input_77_perm_0 = const()[name = tensor("input_77_perm_0"), val = tensor([0, 2, 1])]; tensor input_79_pad_type_0 = const()[name = tensor("input_79_pad_type_0"), val = tensor("valid")]; tensor input_79_strides_0 = const()[name = tensor("input_79_strides_0"), val = tensor([1])]; tensor input_79_pad_0 = const()[name = tensor("input_79_pad_0"), val = tensor([0, 0])]; tensor input_79_dilations_0 = const()[name = tensor("input_79_dilations_0"), val = tensor([1])]; tensor input_79_groups_0 = const()[name = tensor("input_79_groups_0"), val = tensor(1)]; tensor layers_3_ffn_conv1_weight_to_fp16 = const()[name = tensor("layers_3_ffn_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50583680)))]; tensor input_77_cast_fp16 = transpose(perm = input_77_perm_0, x = x_35_cast_fp16)[name = tensor("transpose_181")]; tensor input_79_cast_fp16 = conv(dilations = input_79_dilations_0, groups = input_79_groups_0, pad = input_79_pad_0, pad_type = input_79_pad_type_0, strides = input_79_strides_0, weight = layers_3_ffn_conv1_weight_to_fp16, x = input_77_cast_fp16)[name = tensor("input_79_cast_fp16")]; tensor input_81_mode_0 = const()[name = tensor("input_81_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor input_81_cast_fp16 = gelu(mode = input_81_mode_0, x = input_79_cast_fp16)[name = tensor("input_81_cast_fp16")]; tensor x_37_pad_type_0 = const()[name = tensor("x_37_pad_type_0"), val = tensor("valid")]; tensor x_37_strides_0 = const()[name = tensor("x_37_strides_0"), val = tensor([1])]; tensor x_37_pad_0 = const()[name = tensor("x_37_pad_0"), val = tensor([0, 0])]; tensor x_37_dilations_0 = const()[name = tensor("x_37_dilations_0"), val = tensor([1])]; tensor x_37_groups_0 = const()[name = tensor("x_37_groups_0"), val = tensor(1)]; tensor layers_3_ffn_conv2_weight_to_fp16 = const()[name = tensor("layers_3_ffn_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(55302336)))]; tensor x_37_cast_fp16 = conv(dilations = x_37_dilations_0, groups = x_37_groups_0, pad = x_37_pad_0, pad_type = x_37_pad_type_0, strides = x_37_strides_0, weight = layers_3_ffn_conv2_weight_to_fp16, x = input_81_cast_fp16)[name = tensor("x_37_cast_fp16")]; tensor x_39_perm_0 = const()[name = tensor("x_39_perm_0"), val = tensor([0, 2, 1])]; tensor x_39_cast_fp16 = transpose(perm = x_39_perm_0, x = x_37_cast_fp16)[name = tensor("transpose_180")]; tensor input_83_cast_fp16 = add(x = input_75_cast_fp16, y = x_39_cast_fp16)[name = tensor("input_83_cast_fp16")]; tensor k_padded_7_pad_0 = const()[name = tensor("k_padded_7_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor k_padded_7_mode_0 = const()[name = tensor("k_padded_7_mode_0"), val = tensor("constant")]; tensor const_28_to_fp16 = const()[name = tensor("const_28_to_fp16"), val = tensor(0x0p+0)]; tensor k_padded_7_cast_fp16 = pad(constant_val = const_28_to_fp16, mode = k_padded_7_mode_0, pad = k_padded_7_pad_0, x = k_13_cast_fp16)[name = tensor("k_padded_7_cast_fp16")]; tensor v_padded_7_pad_0 = const()[name = tensor("v_padded_7_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor v_padded_7_mode_0 = const()[name = tensor("v_padded_7_mode_0"), val = tensor("constant")]; tensor const_29_to_fp16 = const()[name = tensor("const_29_to_fp16"), val = tensor(0x0p+0)]; tensor v_padded_7_cast_fp16 = pad(constant_val = const_29_to_fp16, mode = v_padded_7_mode_0, pad = v_padded_7_pad_0, x = v_13_cast_fp16)[name = tensor("v_padded_7_cast_fp16")]; tensor var_706_axis_0 = const()[name = tensor("op_706_axis_0"), val = tensor(0)]; tensor var_706 = stack(axis = var_706_axis_0, values = (k_padded_7_cast_fp16, v_padded_7_cast_fp16))[name = tensor("op_706_cast_fp16")]; tensor var_718 = const()[name = tensor("op_718"), val = tensor(-1)]; tensor x_41_axes_0 = const()[name = tensor("x_41_axes_0"), val = tensor([-1])]; tensor layers_4_norm_sa_weight_to_fp16 = const()[name = tensor("layers_4_norm_sa_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60020992)))]; tensor var_725_to_fp16 = const()[name = tensor("op_725_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_41_cast_fp16 = layer_norm(axes = x_41_axes_0, epsilon = var_725_to_fp16, gamma = layers_4_norm_sa_weight_to_fp16, x = input_83_cast_fp16)[name = tensor("x_41_cast_fp16")]; tensor layers_4_self_attn_qkv_proj_weight_to_fp16 = const()[name = tensor("layers_4_self_attn_qkv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60022592)))]; tensor linear_20_cast_fp16 = linear(bias = linear_0_bias_0_to_fp16, weight = layers_4_self_attn_qkv_proj_weight_to_fp16, x = x_41_cast_fp16)[name = tensor("linear_20_cast_fp16")]; tensor var_743 = const()[name = tensor("op_743"), val = tensor([1, 110, 3, 12, 64])]; tensor qkv_9_cast_fp16 = reshape(shape = var_743, x = linear_20_cast_fp16)[name = tensor("qkv_9_cast_fp16")]; tensor q_25_begin_0 = const()[name = tensor("q_25_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_25_end_0 = const()[name = tensor("q_25_end_0"), val = tensor([1, 110, 1, 12, 64])]; tensor q_25_end_mask_0 = const()[name = tensor("q_25_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_25_squeeze_mask_0 = const()[name = tensor("q_25_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_25_cast_fp16 = slice_by_index(begin = q_25_begin_0, end = q_25_end_0, end_mask = q_25_end_mask_0, squeeze_mask = q_25_squeeze_mask_0, x = qkv_9_cast_fp16)[name = tensor("q_25_cast_fp16")]; tensor k_17_begin_0 = const()[name = tensor("k_17_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_17_end_0 = const()[name = tensor("k_17_end_0"), val = tensor([1, 110, 2, 12, 64])]; tensor k_17_end_mask_0 = const()[name = tensor("k_17_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_17_squeeze_mask_0 = const()[name = tensor("k_17_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_17_cast_fp16 = slice_by_index(begin = k_17_begin_0, end = k_17_end_0, end_mask = k_17_end_mask_0, squeeze_mask = k_17_squeeze_mask_0, x = qkv_9_cast_fp16)[name = tensor("k_17_cast_fp16")]; tensor v_17_begin_0 = const()[name = tensor("v_17_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_17_end_0 = const()[name = tensor("v_17_end_0"), val = tensor([1, 110, 3, 12, 64])]; tensor v_17_end_mask_0 = const()[name = tensor("v_17_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_17_squeeze_mask_0 = const()[name = tensor("v_17_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_17_cast_fp16 = slice_by_index(begin = v_17_begin_0, end = v_17_end_0, end_mask = v_17_end_mask_0, squeeze_mask = v_17_squeeze_mask_0, x = qkv_9_cast_fp16)[name = tensor("v_17_cast_fp16")]; tensor v_t_9_perm_0 = const()[name = tensor("v_t_9_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_758_transpose_x_0 = const()[name = tensor("op_758_transpose_x_0"), val = tensor(false)]; tensor var_758_transpose_y_0 = const()[name = tensor("op_758_transpose_y_0"), val = tensor(false)]; tensor transpose_82_perm_0 = const()[name = tensor("transpose_82_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_83_perm_0 = const()[name = tensor("transpose_83_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_83 = transpose(perm = transpose_83_perm_0, x = k_17_cast_fp16)[name = tensor("transpose_177")]; tensor transpose_82 = transpose(perm = transpose_82_perm_0, x = q_25_cast_fp16)[name = tensor("transpose_178")]; tensor var_758_cast_fp16 = matmul(transpose_x = var_758_transpose_x_0, transpose_y = var_758_transpose_y_0, x = transpose_82, y = transpose_83)[name = tensor("op_758_cast_fp16")]; tensor var_759_to_fp16 = const()[name = tensor("op_759_to_fp16"), val = tensor(0x1p-3)]; tensor attn_33_cast_fp16 = mul(x = var_758_cast_fp16, y = var_759_to_fp16)[name = tensor("attn_33_cast_fp16")]; tensor attn_33_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("attn_33_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor attn_33_cast_fp16_to_fp32 = cast(dtype = attn_33_cast_fp16_to_fp32_dtype_0, x = attn_33_cast_fp16)[name = tensor("cast_85")]; tensor input_85 = add(x = attn_33_cast_fp16_to_fp32, y = var_102)[name = tensor("input_85")]; tensor input_85_to_fp16_dtype_0 = const()[name = tensor("input_85_to_fp16_dtype_0"), val = tensor("fp16")]; tensor input_85_to_fp16 = cast(dtype = input_85_to_fp16_dtype_0, x = input_85)[name = tensor("cast_84")]; tensor attn_35_cast_fp16 = softmax(axis = var_718, x = input_85_to_fp16)[name = tensor("attn_35_cast_fp16")]; tensor out_17_transpose_x_0 = const()[name = tensor("out_17_transpose_x_0"), val = tensor(false)]; tensor out_17_transpose_y_0 = const()[name = tensor("out_17_transpose_y_0"), val = tensor(false)]; tensor v_t_9_cast_fp16 = transpose(perm = v_t_9_perm_0, x = v_17_cast_fp16)[name = tensor("transpose_179")]; tensor out_17_cast_fp16 = matmul(transpose_x = out_17_transpose_x_0, transpose_y = out_17_transpose_y_0, x = attn_35_cast_fp16, y = v_t_9_cast_fp16)[name = tensor("out_17_cast_fp16")]; tensor var_770_perm_0 = const()[name = tensor("op_770_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_771 = const()[name = tensor("op_771"), val = tensor([1, 110, -1])]; tensor var_770_cast_fp16 = transpose(perm = var_770_perm_0, x = out_17_cast_fp16)[name = tensor("transpose_176")]; tensor input_87_cast_fp16 = reshape(shape = var_771, x = var_770_cast_fp16)[name = tensor("input_87_cast_fp16")]; tensor layers_4_self_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_4_self_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(63561600)))]; tensor linear_21_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_4_self_attn_o_proj_weight_to_fp16, x = input_87_cast_fp16)[name = tensor("linear_21_cast_fp16")]; tensor input_89_cast_fp16 = add(x = input_83_cast_fp16, y = linear_21_cast_fp16)[name = tensor("input_89_cast_fp16")]; tensor x_43_axes_0 = const()[name = tensor("x_43_axes_0"), val = tensor([-1])]; tensor layers_4_norm_xa_query_weight_to_fp16 = const()[name = tensor("layers_4_norm_xa_query_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64741312)))]; tensor x_43_cast_fp16 = layer_norm(axes = x_43_axes_0, epsilon = var_725_to_fp16, gamma = layers_4_norm_xa_query_weight_to_fp16, x = input_89_cast_fp16)[name = tensor("x_43_cast_fp16")]; tensor memory_9_axes_0 = const()[name = tensor("memory_9_axes_0"), val = tensor([-1])]; tensor layers_4_norm_xa_memory_weight_to_fp16 = const()[name = tensor("layers_4_norm_xa_memory_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64742912)))]; tensor memory_9_cast_fp16 = layer_norm(axes = memory_9_axes_0, epsilon = var_725_to_fp16, gamma = layers_4_norm_xa_memory_weight_to_fp16, x = encoder_output)[name = tensor("memory_9_cast_fp16")]; tensor layers_4_cross_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_4_cross_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64744512)))]; tensor linear_22_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = layers_4_cross_attn_q_proj_weight_to_fp16, x = x_43_cast_fp16)[name = tensor("linear_22_cast_fp16")]; tensor var_794 = const()[name = tensor("op_794"), val = tensor([1, 110, 1, 128])]; tensor var_795_cast_fp16 = reshape(shape = var_794, x = linear_22_cast_fp16)[name = tensor("op_795_cast_fp16")]; tensor layers_4_cross_attn_kv_proj_weight_to_fp16 = const()[name = tensor("layers_4_cross_attn_kv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64941184)))]; tensor linear_23_cast_fp16 = linear(bias = linear_3_bias_0_to_fp16, weight = layers_4_cross_attn_kv_proj_weight_to_fp16, x = memory_9_cast_fp16)[name = tensor("linear_23_cast_fp16")]; tensor var_799 = const()[name = tensor("op_799"), val = tensor([1, 256, 2, 1, 128])]; tensor kv_9_cast_fp16 = reshape(shape = var_799, x = linear_23_cast_fp16)[name = tensor("kv_9_cast_fp16")]; tensor var_803_begin_0 = const()[name = tensor("op_803_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_803_end_0 = const()[name = tensor("op_803_end_0"), val = tensor([1, 256, 1, 1, 128])]; tensor var_803_end_mask_0 = const()[name = tensor("op_803_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_803_squeeze_mask_0 = const()[name = tensor("op_803_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_803_cast_fp16 = slice_by_index(begin = var_803_begin_0, end = var_803_end_0, end_mask = var_803_end_mask_0, squeeze_mask = var_803_squeeze_mask_0, x = kv_9_cast_fp16)[name = tensor("op_803_cast_fp16")]; tensor var_807_begin_0 = const()[name = tensor("op_807_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor var_807_end_0 = const()[name = tensor("op_807_end_0"), val = tensor([1, 256, 2, 1, 128])]; tensor var_807_end_mask_0 = const()[name = tensor("op_807_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_807_squeeze_mask_0 = const()[name = tensor("op_807_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_807_cast_fp16 = slice_by_index(begin = var_807_begin_0, end = var_807_end_0, end_mask = var_807_end_mask_0, squeeze_mask = var_807_squeeze_mask_0, x = kv_9_cast_fp16)[name = tensor("op_807_cast_fp16")]; tensor v_19_perm_0 = const()[name = tensor("v_19_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_810_transpose_x_0 = const()[name = tensor("op_810_transpose_x_0"), val = tensor(false)]; tensor var_810_transpose_y_0 = const()[name = tensor("op_810_transpose_y_0"), val = tensor(false)]; tensor transpose_84_perm_0 = const()[name = tensor("transpose_84_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_85_perm_0 = const()[name = tensor("transpose_85_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_85 = transpose(perm = transpose_85_perm_0, x = var_803_cast_fp16)[name = tensor("transpose_173")]; tensor transpose_84 = transpose(perm = transpose_84_perm_0, x = var_795_cast_fp16)[name = tensor("transpose_174")]; tensor var_810_cast_fp16 = matmul(transpose_x = var_810_transpose_x_0, transpose_y = var_810_transpose_y_0, x = transpose_84, y = transpose_85)[name = tensor("op_810_cast_fp16")]; tensor var_811_to_fp16 = const()[name = tensor("op_811_to_fp16"), val = tensor(0x1.6ap-4)]; tensor attn_37_cast_fp16 = mul(x = var_810_cast_fp16, y = var_811_to_fp16)[name = tensor("attn_37_cast_fp16")]; tensor var_709_to_fp16 = const()[name = tensor("op_709_to_fp16"), val = tensor(-inf)]; tensor input_91_cast_fp16 = select(a = var_709_to_fp16, b = attn_37_cast_fp16, cond = var_151)[name = tensor("input_91_cast_fp16")]; tensor attn_39_cast_fp16 = softmax(axis = var_718, x = input_91_cast_fp16)[name = tensor("attn_39_cast_fp16")]; tensor out_19_transpose_x_0 = const()[name = tensor("out_19_transpose_x_0"), val = tensor(false)]; tensor out_19_transpose_y_0 = const()[name = tensor("out_19_transpose_y_0"), val = tensor(false)]; tensor v_19_cast_fp16 = transpose(perm = v_19_perm_0, x = var_807_cast_fp16)[name = tensor("transpose_175")]; tensor out_19_cast_fp16 = matmul(transpose_x = out_19_transpose_x_0, transpose_y = out_19_transpose_y_0, x = attn_39_cast_fp16, y = v_19_cast_fp16)[name = tensor("out_19_cast_fp16")]; tensor var_819_perm_0 = const()[name = tensor("op_819_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_820 = const()[name = tensor("op_820"), val = tensor([1, 110, -1])]; tensor var_819_cast_fp16 = transpose(perm = var_819_perm_0, x = out_19_cast_fp16)[name = tensor("transpose_172")]; tensor input_93_cast_fp16 = reshape(shape = var_820, x = var_819_cast_fp16)[name = tensor("input_93_cast_fp16")]; tensor layers_4_cross_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_4_cross_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65334464)))]; tensor linear_24_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_4_cross_attn_o_proj_weight_to_fp16, x = input_93_cast_fp16)[name = tensor("linear_24_cast_fp16")]; tensor input_95_cast_fp16 = add(x = input_89_cast_fp16, y = linear_24_cast_fp16)[name = tensor("input_95_cast_fp16")]; tensor x_45_axes_0 = const()[name = tensor("x_45_axes_0"), val = tensor([-1])]; tensor layers_4_norm_ff_weight_to_fp16 = const()[name = tensor("layers_4_norm_ff_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65531136)))]; tensor x_45_cast_fp16 = layer_norm(axes = x_45_axes_0, epsilon = var_725_to_fp16, gamma = layers_4_norm_ff_weight_to_fp16, x = input_95_cast_fp16)[name = tensor("x_45_cast_fp16")]; tensor input_97_perm_0 = const()[name = tensor("input_97_perm_0"), val = tensor([0, 2, 1])]; tensor input_99_pad_type_0 = const()[name = tensor("input_99_pad_type_0"), val = tensor("valid")]; tensor input_99_strides_0 = const()[name = tensor("input_99_strides_0"), val = tensor([1])]; tensor input_99_pad_0 = const()[name = tensor("input_99_pad_0"), val = tensor([0, 0])]; tensor input_99_dilations_0 = const()[name = tensor("input_99_dilations_0"), val = tensor([1])]; tensor input_99_groups_0 = const()[name = tensor("input_99_groups_0"), val = tensor(1)]; tensor layers_4_ffn_conv1_weight_to_fp16 = const()[name = tensor("layers_4_ffn_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65532736)))]; tensor input_97_cast_fp16 = transpose(perm = input_97_perm_0, x = x_45_cast_fp16)[name = tensor("transpose_171")]; tensor input_99_cast_fp16 = conv(dilations = input_99_dilations_0, groups = input_99_groups_0, pad = input_99_pad_0, pad_type = input_99_pad_type_0, strides = input_99_strides_0, weight = layers_4_ffn_conv1_weight_to_fp16, x = input_97_cast_fp16)[name = tensor("input_99_cast_fp16")]; tensor input_101_mode_0 = const()[name = tensor("input_101_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor input_101_cast_fp16 = gelu(mode = input_101_mode_0, x = input_99_cast_fp16)[name = tensor("input_101_cast_fp16")]; tensor x_47_pad_type_0 = const()[name = tensor("x_47_pad_type_0"), val = tensor("valid")]; tensor x_47_strides_0 = const()[name = tensor("x_47_strides_0"), val = tensor([1])]; tensor x_47_pad_0 = const()[name = tensor("x_47_pad_0"), val = tensor([0, 0])]; tensor x_47_dilations_0 = const()[name = tensor("x_47_dilations_0"), val = tensor([1])]; tensor x_47_groups_0 = const()[name = tensor("x_47_groups_0"), val = tensor(1)]; tensor layers_4_ffn_conv2_weight_to_fp16 = const()[name = tensor("layers_4_ffn_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(70251392)))]; tensor x_47_cast_fp16 = conv(dilations = x_47_dilations_0, groups = x_47_groups_0, pad = x_47_pad_0, pad_type = x_47_pad_type_0, strides = x_47_strides_0, weight = layers_4_ffn_conv2_weight_to_fp16, x = input_101_cast_fp16)[name = tensor("x_47_cast_fp16")]; tensor x_49_perm_0 = const()[name = tensor("x_49_perm_0"), val = tensor([0, 2, 1])]; tensor x_49_cast_fp16 = transpose(perm = x_49_perm_0, x = x_47_cast_fp16)[name = tensor("transpose_170")]; tensor input_103_cast_fp16 = add(x = input_95_cast_fp16, y = x_49_cast_fp16)[name = tensor("input_103_cast_fp16")]; tensor k_padded_9_pad_0 = const()[name = tensor("k_padded_9_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor k_padded_9_mode_0 = const()[name = tensor("k_padded_9_mode_0"), val = tensor("constant")]; tensor const_35_to_fp16 = const()[name = tensor("const_35_to_fp16"), val = tensor(0x0p+0)]; tensor k_padded_9_cast_fp16 = pad(constant_val = const_35_to_fp16, mode = k_padded_9_mode_0, pad = k_padded_9_pad_0, x = k_17_cast_fp16)[name = tensor("k_padded_9_cast_fp16")]; tensor v_padded_9_pad_0 = const()[name = tensor("v_padded_9_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor v_padded_9_mode_0 = const()[name = tensor("v_padded_9_mode_0"), val = tensor("constant")]; tensor const_36_to_fp16 = const()[name = tensor("const_36_to_fp16"), val = tensor(0x0p+0)]; tensor v_padded_9_cast_fp16 = pad(constant_val = const_36_to_fp16, mode = v_padded_9_mode_0, pad = v_padded_9_pad_0, x = v_17_cast_fp16)[name = tensor("v_padded_9_cast_fp16")]; tensor var_872_axis_0 = const()[name = tensor("op_872_axis_0"), val = tensor(0)]; tensor var_872 = stack(axis = var_872_axis_0, values = (k_padded_9_cast_fp16, v_padded_9_cast_fp16))[name = tensor("op_872_cast_fp16")]; tensor var_884 = const()[name = tensor("op_884"), val = tensor(-1)]; tensor x_51_axes_0 = const()[name = tensor("x_51_axes_0"), val = tensor([-1])]; tensor layers_5_norm_sa_weight_to_fp16 = const()[name = tensor("layers_5_norm_sa_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(74970048)))]; tensor var_891_to_fp16 = const()[name = tensor("op_891_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_51_cast_fp16 = layer_norm(axes = x_51_axes_0, epsilon = var_891_to_fp16, gamma = layers_5_norm_sa_weight_to_fp16, x = input_103_cast_fp16)[name = tensor("x_51_cast_fp16")]; tensor layers_5_self_attn_qkv_proj_weight_to_fp16 = const()[name = tensor("layers_5_self_attn_qkv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(74971648)))]; tensor linear_25_cast_fp16 = linear(bias = linear_0_bias_0_to_fp16, weight = layers_5_self_attn_qkv_proj_weight_to_fp16, x = x_51_cast_fp16)[name = tensor("linear_25_cast_fp16")]; tensor var_909 = const()[name = tensor("op_909"), val = tensor([1, 110, 3, 12, 64])]; tensor qkv_11_cast_fp16 = reshape(shape = var_909, x = linear_25_cast_fp16)[name = tensor("qkv_11_cast_fp16")]; tensor q_31_begin_0 = const()[name = tensor("q_31_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_31_end_0 = const()[name = tensor("q_31_end_0"), val = tensor([1, 110, 1, 12, 64])]; tensor q_31_end_mask_0 = const()[name = tensor("q_31_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_31_squeeze_mask_0 = const()[name = tensor("q_31_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_31_cast_fp16 = slice_by_index(begin = q_31_begin_0, end = q_31_end_0, end_mask = q_31_end_mask_0, squeeze_mask = q_31_squeeze_mask_0, x = qkv_11_cast_fp16)[name = tensor("q_31_cast_fp16")]; tensor k_21_begin_0 = const()[name = tensor("k_21_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_21_end_0 = const()[name = tensor("k_21_end_0"), val = tensor([1, 110, 2, 12, 64])]; tensor k_21_end_mask_0 = const()[name = tensor("k_21_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_21_squeeze_mask_0 = const()[name = tensor("k_21_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_21_cast_fp16 = slice_by_index(begin = k_21_begin_0, end = k_21_end_0, end_mask = k_21_end_mask_0, squeeze_mask = k_21_squeeze_mask_0, x = qkv_11_cast_fp16)[name = tensor("k_21_cast_fp16")]; tensor v_21_begin_0 = const()[name = tensor("v_21_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_21_end_0 = const()[name = tensor("v_21_end_0"), val = tensor([1, 110, 3, 12, 64])]; tensor v_21_end_mask_0 = const()[name = tensor("v_21_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_21_squeeze_mask_0 = const()[name = tensor("v_21_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_21_cast_fp16 = slice_by_index(begin = v_21_begin_0, end = v_21_end_0, end_mask = v_21_end_mask_0, squeeze_mask = v_21_squeeze_mask_0, x = qkv_11_cast_fp16)[name = tensor("v_21_cast_fp16")]; tensor v_t_11_perm_0 = const()[name = tensor("v_t_11_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_924_transpose_x_0 = const()[name = tensor("op_924_transpose_x_0"), val = tensor(false)]; tensor var_924_transpose_y_0 = const()[name = tensor("op_924_transpose_y_0"), val = tensor(false)]; tensor transpose_86_perm_0 = const()[name = tensor("transpose_86_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_87_perm_0 = const()[name = tensor("transpose_87_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_87 = transpose(perm = transpose_87_perm_0, x = k_21_cast_fp16)[name = tensor("transpose_167")]; tensor transpose_86 = transpose(perm = transpose_86_perm_0, x = q_31_cast_fp16)[name = tensor("transpose_168")]; tensor var_924_cast_fp16 = matmul(transpose_x = var_924_transpose_x_0, transpose_y = var_924_transpose_y_0, x = transpose_86, y = transpose_87)[name = tensor("op_924_cast_fp16")]; tensor var_925_to_fp16 = const()[name = tensor("op_925_to_fp16"), val = tensor(0x1p-3)]; tensor attn_41_cast_fp16 = mul(x = var_924_cast_fp16, y = var_925_to_fp16)[name = tensor("attn_41_cast_fp16")]; tensor attn_41_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("attn_41_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor attn_41_cast_fp16_to_fp32 = cast(dtype = attn_41_cast_fp16_to_fp32_dtype_0, x = attn_41_cast_fp16)[name = tensor("cast_83")]; tensor input_105 = add(x = attn_41_cast_fp16_to_fp32, y = var_102)[name = tensor("input_105")]; tensor input_105_to_fp16_dtype_0 = const()[name = tensor("input_105_to_fp16_dtype_0"), val = tensor("fp16")]; tensor input_105_to_fp16 = cast(dtype = input_105_to_fp16_dtype_0, x = input_105)[name = tensor("cast_82")]; tensor attn_43_cast_fp16 = softmax(axis = var_884, x = input_105_to_fp16)[name = tensor("attn_43_cast_fp16")]; tensor out_21_transpose_x_0 = const()[name = tensor("out_21_transpose_x_0"), val = tensor(false)]; tensor out_21_transpose_y_0 = const()[name = tensor("out_21_transpose_y_0"), val = tensor(false)]; tensor v_t_11_cast_fp16 = transpose(perm = v_t_11_perm_0, x = v_21_cast_fp16)[name = tensor("transpose_169")]; tensor out_21_cast_fp16 = matmul(transpose_x = out_21_transpose_x_0, transpose_y = out_21_transpose_y_0, x = attn_43_cast_fp16, y = v_t_11_cast_fp16)[name = tensor("out_21_cast_fp16")]; tensor var_936_perm_0 = const()[name = tensor("op_936_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_937 = const()[name = tensor("op_937"), val = tensor([1, 110, -1])]; tensor var_936_cast_fp16 = transpose(perm = var_936_perm_0, x = out_21_cast_fp16)[name = tensor("transpose_166")]; tensor input_107_cast_fp16 = reshape(shape = var_937, x = var_936_cast_fp16)[name = tensor("input_107_cast_fp16")]; tensor layers_5_self_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_5_self_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78510656)))]; tensor linear_26_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_5_self_attn_o_proj_weight_to_fp16, x = input_107_cast_fp16)[name = tensor("linear_26_cast_fp16")]; tensor input_109_cast_fp16 = add(x = input_103_cast_fp16, y = linear_26_cast_fp16)[name = tensor("input_109_cast_fp16")]; tensor x_53_axes_0 = const()[name = tensor("x_53_axes_0"), val = tensor([-1])]; tensor layers_5_norm_xa_query_weight_to_fp16 = const()[name = tensor("layers_5_norm_xa_query_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(79690368)))]; tensor x_53_cast_fp16 = layer_norm(axes = x_53_axes_0, epsilon = var_891_to_fp16, gamma = layers_5_norm_xa_query_weight_to_fp16, x = input_109_cast_fp16)[name = tensor("x_53_cast_fp16")]; tensor memory_11_axes_0 = const()[name = tensor("memory_11_axes_0"), val = tensor([-1])]; tensor layers_5_norm_xa_memory_weight_to_fp16 = const()[name = tensor("layers_5_norm_xa_memory_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(79691968)))]; tensor memory_11_cast_fp16 = layer_norm(axes = memory_11_axes_0, epsilon = var_891_to_fp16, gamma = layers_5_norm_xa_memory_weight_to_fp16, x = encoder_output)[name = tensor("memory_11_cast_fp16")]; tensor layers_5_cross_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_5_cross_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(79693568)))]; tensor linear_27_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = layers_5_cross_attn_q_proj_weight_to_fp16, x = x_53_cast_fp16)[name = tensor("linear_27_cast_fp16")]; tensor var_960 = const()[name = tensor("op_960"), val = tensor([1, 110, 1, 128])]; tensor var_961_cast_fp16 = reshape(shape = var_960, x = linear_27_cast_fp16)[name = tensor("op_961_cast_fp16")]; tensor layers_5_cross_attn_kv_proj_weight_to_fp16 = const()[name = tensor("layers_5_cross_attn_kv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(79890240)))]; tensor linear_28_cast_fp16 = linear(bias = linear_3_bias_0_to_fp16, weight = layers_5_cross_attn_kv_proj_weight_to_fp16, x = memory_11_cast_fp16)[name = tensor("linear_28_cast_fp16")]; tensor var_965 = const()[name = tensor("op_965"), val = tensor([1, 256, 2, 1, 128])]; tensor kv_11_cast_fp16 = reshape(shape = var_965, x = linear_28_cast_fp16)[name = tensor("kv_11_cast_fp16")]; tensor var_969_begin_0 = const()[name = tensor("op_969_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_969_end_0 = const()[name = tensor("op_969_end_0"), val = tensor([1, 256, 1, 1, 128])]; tensor var_969_end_mask_0 = const()[name = tensor("op_969_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_969_squeeze_mask_0 = const()[name = tensor("op_969_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_969_cast_fp16 = slice_by_index(begin = var_969_begin_0, end = var_969_end_0, end_mask = var_969_end_mask_0, squeeze_mask = var_969_squeeze_mask_0, x = kv_11_cast_fp16)[name = tensor("op_969_cast_fp16")]; tensor var_973_begin_0 = const()[name = tensor("op_973_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor var_973_end_0 = const()[name = tensor("op_973_end_0"), val = tensor([1, 256, 2, 1, 128])]; tensor var_973_end_mask_0 = const()[name = tensor("op_973_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_973_squeeze_mask_0 = const()[name = tensor("op_973_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_973_cast_fp16 = slice_by_index(begin = var_973_begin_0, end = var_973_end_0, end_mask = var_973_end_mask_0, squeeze_mask = var_973_squeeze_mask_0, x = kv_11_cast_fp16)[name = tensor("op_973_cast_fp16")]; tensor v_23_perm_0 = const()[name = tensor("v_23_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_976_transpose_x_0 = const()[name = tensor("op_976_transpose_x_0"), val = tensor(false)]; tensor var_976_transpose_y_0 = const()[name = tensor("op_976_transpose_y_0"), val = tensor(false)]; tensor transpose_88_perm_0 = const()[name = tensor("transpose_88_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_89_perm_0 = const()[name = tensor("transpose_89_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_89 = transpose(perm = transpose_89_perm_0, x = var_969_cast_fp16)[name = tensor("transpose_163")]; tensor transpose_88 = transpose(perm = transpose_88_perm_0, x = var_961_cast_fp16)[name = tensor("transpose_164")]; tensor var_976_cast_fp16 = matmul(transpose_x = var_976_transpose_x_0, transpose_y = var_976_transpose_y_0, x = transpose_88, y = transpose_89)[name = tensor("op_976_cast_fp16")]; tensor var_977_to_fp16 = const()[name = tensor("op_977_to_fp16"), val = tensor(0x1.6ap-4)]; tensor attn_45_cast_fp16 = mul(x = var_976_cast_fp16, y = var_977_to_fp16)[name = tensor("attn_45_cast_fp16")]; tensor var_875_to_fp16 = const()[name = tensor("op_875_to_fp16"), val = tensor(-inf)]; tensor input_111_cast_fp16 = select(a = var_875_to_fp16, b = attn_45_cast_fp16, cond = var_151)[name = tensor("input_111_cast_fp16")]; tensor attn_47_cast_fp16 = softmax(axis = var_884, x = input_111_cast_fp16)[name = tensor("attn_47_cast_fp16")]; tensor out_23_transpose_x_0 = const()[name = tensor("out_23_transpose_x_0"), val = tensor(false)]; tensor out_23_transpose_y_0 = const()[name = tensor("out_23_transpose_y_0"), val = tensor(false)]; tensor v_23_cast_fp16 = transpose(perm = v_23_perm_0, x = var_973_cast_fp16)[name = tensor("transpose_165")]; tensor out_23_cast_fp16 = matmul(transpose_x = out_23_transpose_x_0, transpose_y = out_23_transpose_y_0, x = attn_47_cast_fp16, y = v_23_cast_fp16)[name = tensor("out_23_cast_fp16")]; tensor var_985_perm_0 = const()[name = tensor("op_985_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_986 = const()[name = tensor("op_986"), val = tensor([1, 110, -1])]; tensor var_985_cast_fp16 = transpose(perm = var_985_perm_0, x = out_23_cast_fp16)[name = tensor("transpose_162")]; tensor input_113_cast_fp16 = reshape(shape = var_986, x = var_985_cast_fp16)[name = tensor("input_113_cast_fp16")]; tensor layers_5_cross_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_5_cross_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80283520)))]; tensor linear_29_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_5_cross_attn_o_proj_weight_to_fp16, x = input_113_cast_fp16)[name = tensor("linear_29_cast_fp16")]; tensor input_115_cast_fp16 = add(x = input_109_cast_fp16, y = linear_29_cast_fp16)[name = tensor("input_115_cast_fp16")]; tensor x_55_axes_0 = const()[name = tensor("x_55_axes_0"), val = tensor([-1])]; tensor layers_5_norm_ff_weight_to_fp16 = const()[name = tensor("layers_5_norm_ff_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80480192)))]; tensor x_55_cast_fp16 = layer_norm(axes = x_55_axes_0, epsilon = var_891_to_fp16, gamma = layers_5_norm_ff_weight_to_fp16, x = input_115_cast_fp16)[name = tensor("x_55_cast_fp16")]; tensor input_117_perm_0 = const()[name = tensor("input_117_perm_0"), val = tensor([0, 2, 1])]; tensor input_119_pad_type_0 = const()[name = tensor("input_119_pad_type_0"), val = tensor("valid")]; tensor input_119_strides_0 = const()[name = tensor("input_119_strides_0"), val = tensor([1])]; tensor input_119_pad_0 = const()[name = tensor("input_119_pad_0"), val = tensor([0, 0])]; tensor input_119_dilations_0 = const()[name = tensor("input_119_dilations_0"), val = tensor([1])]; tensor input_119_groups_0 = const()[name = tensor("input_119_groups_0"), val = tensor(1)]; tensor layers_5_ffn_conv1_weight_to_fp16 = const()[name = tensor("layers_5_ffn_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80481792)))]; tensor input_117_cast_fp16 = transpose(perm = input_117_perm_0, x = x_55_cast_fp16)[name = tensor("transpose_161")]; tensor input_119_cast_fp16 = conv(dilations = input_119_dilations_0, groups = input_119_groups_0, pad = input_119_pad_0, pad_type = input_119_pad_type_0, strides = input_119_strides_0, weight = layers_5_ffn_conv1_weight_to_fp16, x = input_117_cast_fp16)[name = tensor("input_119_cast_fp16")]; tensor input_121_mode_0 = const()[name = tensor("input_121_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor input_121_cast_fp16 = gelu(mode = input_121_mode_0, x = input_119_cast_fp16)[name = tensor("input_121_cast_fp16")]; tensor x_57_pad_type_0 = const()[name = tensor("x_57_pad_type_0"), val = tensor("valid")]; tensor x_57_strides_0 = const()[name = tensor("x_57_strides_0"), val = tensor([1])]; tensor x_57_pad_0 = const()[name = tensor("x_57_pad_0"), val = tensor([0, 0])]; tensor x_57_dilations_0 = const()[name = tensor("x_57_dilations_0"), val = tensor([1])]; tensor x_57_groups_0 = const()[name = tensor("x_57_groups_0"), val = tensor(1)]; tensor layers_5_ffn_conv2_weight_to_fp16 = const()[name = tensor("layers_5_ffn_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85200448)))]; tensor x_57_cast_fp16 = conv(dilations = x_57_dilations_0, groups = x_57_groups_0, pad = x_57_pad_0, pad_type = x_57_pad_type_0, strides = x_57_strides_0, weight = layers_5_ffn_conv2_weight_to_fp16, x = input_121_cast_fp16)[name = tensor("x_57_cast_fp16")]; tensor x_59_perm_0 = const()[name = tensor("x_59_perm_0"), val = tensor([0, 2, 1])]; tensor x_59_cast_fp16 = transpose(perm = x_59_perm_0, x = x_57_cast_fp16)[name = tensor("transpose_160")]; tensor input_123_cast_fp16 = add(x = input_115_cast_fp16, y = x_59_cast_fp16)[name = tensor("input_123_cast_fp16")]; tensor k_padded_11_pad_0 = const()[name = tensor("k_padded_11_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor k_padded_11_mode_0 = const()[name = tensor("k_padded_11_mode_0"), val = tensor("constant")]; tensor const_42_to_fp16 = const()[name = tensor("const_42_to_fp16"), val = tensor(0x0p+0)]; tensor k_padded_11_cast_fp16 = pad(constant_val = const_42_to_fp16, mode = k_padded_11_mode_0, pad = k_padded_11_pad_0, x = k_21_cast_fp16)[name = tensor("k_padded_11_cast_fp16")]; tensor v_padded_11_pad_0 = const()[name = tensor("v_padded_11_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor v_padded_11_mode_0 = const()[name = tensor("v_padded_11_mode_0"), val = tensor("constant")]; tensor const_43_to_fp16 = const()[name = tensor("const_43_to_fp16"), val = tensor(0x0p+0)]; tensor v_padded_11_cast_fp16 = pad(constant_val = const_43_to_fp16, mode = v_padded_11_mode_0, pad = v_padded_11_pad_0, x = v_21_cast_fp16)[name = tensor("v_padded_11_cast_fp16")]; tensor var_1038_axis_0 = const()[name = tensor("op_1038_axis_0"), val = tensor(0)]; tensor var_1038 = stack(axis = var_1038_axis_0, values = (k_padded_11_cast_fp16, v_padded_11_cast_fp16))[name = tensor("op_1038_cast_fp16")]; tensor var_1050 = const()[name = tensor("op_1050"), val = tensor(-1)]; tensor x_61_axes_0 = const()[name = tensor("x_61_axes_0"), val = tensor([-1])]; tensor layers_6_norm_sa_weight_to_fp16 = const()[name = tensor("layers_6_norm_sa_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89919104)))]; tensor var_1057_to_fp16 = const()[name = tensor("op_1057_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_61_cast_fp16 = layer_norm(axes = x_61_axes_0, epsilon = var_1057_to_fp16, gamma = layers_6_norm_sa_weight_to_fp16, x = input_123_cast_fp16)[name = tensor("x_61_cast_fp16")]; tensor layers_6_self_attn_qkv_proj_weight_to_fp16 = const()[name = tensor("layers_6_self_attn_qkv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89920704)))]; tensor linear_30_cast_fp16 = linear(bias = linear_0_bias_0_to_fp16, weight = layers_6_self_attn_qkv_proj_weight_to_fp16, x = x_61_cast_fp16)[name = tensor("linear_30_cast_fp16")]; tensor var_1075 = const()[name = tensor("op_1075"), val = tensor([1, 110, 3, 12, 64])]; tensor qkv_13_cast_fp16 = reshape(shape = var_1075, x = linear_30_cast_fp16)[name = tensor("qkv_13_cast_fp16")]; tensor q_37_begin_0 = const()[name = tensor("q_37_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_37_end_0 = const()[name = tensor("q_37_end_0"), val = tensor([1, 110, 1, 12, 64])]; tensor q_37_end_mask_0 = const()[name = tensor("q_37_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_37_squeeze_mask_0 = const()[name = tensor("q_37_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_37_cast_fp16 = slice_by_index(begin = q_37_begin_0, end = q_37_end_0, end_mask = q_37_end_mask_0, squeeze_mask = q_37_squeeze_mask_0, x = qkv_13_cast_fp16)[name = tensor("q_37_cast_fp16")]; tensor k_25_begin_0 = const()[name = tensor("k_25_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_25_end_0 = const()[name = tensor("k_25_end_0"), val = tensor([1, 110, 2, 12, 64])]; tensor k_25_end_mask_0 = const()[name = tensor("k_25_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_25_squeeze_mask_0 = const()[name = tensor("k_25_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_25_cast_fp16 = slice_by_index(begin = k_25_begin_0, end = k_25_end_0, end_mask = k_25_end_mask_0, squeeze_mask = k_25_squeeze_mask_0, x = qkv_13_cast_fp16)[name = tensor("k_25_cast_fp16")]; tensor v_25_begin_0 = const()[name = tensor("v_25_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_25_end_0 = const()[name = tensor("v_25_end_0"), val = tensor([1, 110, 3, 12, 64])]; tensor v_25_end_mask_0 = const()[name = tensor("v_25_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_25_squeeze_mask_0 = const()[name = tensor("v_25_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_25_cast_fp16 = slice_by_index(begin = v_25_begin_0, end = v_25_end_0, end_mask = v_25_end_mask_0, squeeze_mask = v_25_squeeze_mask_0, x = qkv_13_cast_fp16)[name = tensor("v_25_cast_fp16")]; tensor v_t_13_perm_0 = const()[name = tensor("v_t_13_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1090_transpose_x_0 = const()[name = tensor("op_1090_transpose_x_0"), val = tensor(false)]; tensor var_1090_transpose_y_0 = const()[name = tensor("op_1090_transpose_y_0"), val = tensor(false)]; tensor transpose_90_perm_0 = const()[name = tensor("transpose_90_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_91_perm_0 = const()[name = tensor("transpose_91_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_91 = transpose(perm = transpose_91_perm_0, x = k_25_cast_fp16)[name = tensor("transpose_157")]; tensor transpose_90 = transpose(perm = transpose_90_perm_0, x = q_37_cast_fp16)[name = tensor("transpose_158")]; tensor var_1090_cast_fp16 = matmul(transpose_x = var_1090_transpose_x_0, transpose_y = var_1090_transpose_y_0, x = transpose_90, y = transpose_91)[name = tensor("op_1090_cast_fp16")]; tensor var_1091_to_fp16 = const()[name = tensor("op_1091_to_fp16"), val = tensor(0x1p-3)]; tensor attn_49_cast_fp16 = mul(x = var_1090_cast_fp16, y = var_1091_to_fp16)[name = tensor("attn_49_cast_fp16")]; tensor attn_49_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("attn_49_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor attn_49_cast_fp16_to_fp32 = cast(dtype = attn_49_cast_fp16_to_fp32_dtype_0, x = attn_49_cast_fp16)[name = tensor("cast_81")]; tensor input_125 = add(x = attn_49_cast_fp16_to_fp32, y = var_102)[name = tensor("input_125")]; tensor input_125_to_fp16_dtype_0 = const()[name = tensor("input_125_to_fp16_dtype_0"), val = tensor("fp16")]; tensor input_125_to_fp16 = cast(dtype = input_125_to_fp16_dtype_0, x = input_125)[name = tensor("cast_80")]; tensor attn_51_cast_fp16 = softmax(axis = var_1050, x = input_125_to_fp16)[name = tensor("attn_51_cast_fp16")]; tensor out_25_transpose_x_0 = const()[name = tensor("out_25_transpose_x_0"), val = tensor(false)]; tensor out_25_transpose_y_0 = const()[name = tensor("out_25_transpose_y_0"), val = tensor(false)]; tensor v_t_13_cast_fp16 = transpose(perm = v_t_13_perm_0, x = v_25_cast_fp16)[name = tensor("transpose_159")]; tensor out_25_cast_fp16 = matmul(transpose_x = out_25_transpose_x_0, transpose_y = out_25_transpose_y_0, x = attn_51_cast_fp16, y = v_t_13_cast_fp16)[name = tensor("out_25_cast_fp16")]; tensor var_1102_perm_0 = const()[name = tensor("op_1102_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1103 = const()[name = tensor("op_1103"), val = tensor([1, 110, -1])]; tensor var_1102_cast_fp16 = transpose(perm = var_1102_perm_0, x = out_25_cast_fp16)[name = tensor("transpose_156")]; tensor input_127_cast_fp16 = reshape(shape = var_1103, x = var_1102_cast_fp16)[name = tensor("input_127_cast_fp16")]; tensor layers_6_self_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_6_self_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93459712)))]; tensor linear_31_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_6_self_attn_o_proj_weight_to_fp16, x = input_127_cast_fp16)[name = tensor("linear_31_cast_fp16")]; tensor input_129_cast_fp16 = add(x = input_123_cast_fp16, y = linear_31_cast_fp16)[name = tensor("input_129_cast_fp16")]; tensor x_63_axes_0 = const()[name = tensor("x_63_axes_0"), val = tensor([-1])]; tensor layers_6_norm_xa_query_weight_to_fp16 = const()[name = tensor("layers_6_norm_xa_query_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94639424)))]; tensor x_63_cast_fp16 = layer_norm(axes = x_63_axes_0, epsilon = var_1057_to_fp16, gamma = layers_6_norm_xa_query_weight_to_fp16, x = input_129_cast_fp16)[name = tensor("x_63_cast_fp16")]; tensor memory_13_axes_0 = const()[name = tensor("memory_13_axes_0"), val = tensor([-1])]; tensor layers_6_norm_xa_memory_weight_to_fp16 = const()[name = tensor("layers_6_norm_xa_memory_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94641024)))]; tensor memory_13_cast_fp16 = layer_norm(axes = memory_13_axes_0, epsilon = var_1057_to_fp16, gamma = layers_6_norm_xa_memory_weight_to_fp16, x = encoder_output)[name = tensor("memory_13_cast_fp16")]; tensor layers_6_cross_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_6_cross_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94642624)))]; tensor linear_32_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = layers_6_cross_attn_q_proj_weight_to_fp16, x = x_63_cast_fp16)[name = tensor("linear_32_cast_fp16")]; tensor var_1126 = const()[name = tensor("op_1126"), val = tensor([1, 110, 1, 128])]; tensor var_1127_cast_fp16 = reshape(shape = var_1126, x = linear_32_cast_fp16)[name = tensor("op_1127_cast_fp16")]; tensor layers_6_cross_attn_kv_proj_weight_to_fp16 = const()[name = tensor("layers_6_cross_attn_kv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94839296)))]; tensor linear_33_cast_fp16 = linear(bias = linear_3_bias_0_to_fp16, weight = layers_6_cross_attn_kv_proj_weight_to_fp16, x = memory_13_cast_fp16)[name = tensor("linear_33_cast_fp16")]; tensor var_1131 = const()[name = tensor("op_1131"), val = tensor([1, 256, 2, 1, 128])]; tensor kv_13_cast_fp16 = reshape(shape = var_1131, x = linear_33_cast_fp16)[name = tensor("kv_13_cast_fp16")]; tensor var_1135_begin_0 = const()[name = tensor("op_1135_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_1135_end_0 = const()[name = tensor("op_1135_end_0"), val = tensor([1, 256, 1, 1, 128])]; tensor var_1135_end_mask_0 = const()[name = tensor("op_1135_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_1135_squeeze_mask_0 = const()[name = tensor("op_1135_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_1135_cast_fp16 = slice_by_index(begin = var_1135_begin_0, end = var_1135_end_0, end_mask = var_1135_end_mask_0, squeeze_mask = var_1135_squeeze_mask_0, x = kv_13_cast_fp16)[name = tensor("op_1135_cast_fp16")]; tensor var_1139_begin_0 = const()[name = tensor("op_1139_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor var_1139_end_0 = const()[name = tensor("op_1139_end_0"), val = tensor([1, 256, 2, 1, 128])]; tensor var_1139_end_mask_0 = const()[name = tensor("op_1139_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_1139_squeeze_mask_0 = const()[name = tensor("op_1139_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_1139_cast_fp16 = slice_by_index(begin = var_1139_begin_0, end = var_1139_end_0, end_mask = var_1139_end_mask_0, squeeze_mask = var_1139_squeeze_mask_0, x = kv_13_cast_fp16)[name = tensor("op_1139_cast_fp16")]; tensor v_27_perm_0 = const()[name = tensor("v_27_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1142_transpose_x_0 = const()[name = tensor("op_1142_transpose_x_0"), val = tensor(false)]; tensor var_1142_transpose_y_0 = const()[name = tensor("op_1142_transpose_y_0"), val = tensor(false)]; tensor transpose_92_perm_0 = const()[name = tensor("transpose_92_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_93_perm_0 = const()[name = tensor("transpose_93_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_93 = transpose(perm = transpose_93_perm_0, x = var_1135_cast_fp16)[name = tensor("transpose_153")]; tensor transpose_92 = transpose(perm = transpose_92_perm_0, x = var_1127_cast_fp16)[name = tensor("transpose_154")]; tensor var_1142_cast_fp16 = matmul(transpose_x = var_1142_transpose_x_0, transpose_y = var_1142_transpose_y_0, x = transpose_92, y = transpose_93)[name = tensor("op_1142_cast_fp16")]; tensor var_1143_to_fp16 = const()[name = tensor("op_1143_to_fp16"), val = tensor(0x1.6ap-4)]; tensor attn_53_cast_fp16 = mul(x = var_1142_cast_fp16, y = var_1143_to_fp16)[name = tensor("attn_53_cast_fp16")]; tensor var_1041_to_fp16 = const()[name = tensor("op_1041_to_fp16"), val = tensor(-inf)]; tensor input_131_cast_fp16 = select(a = var_1041_to_fp16, b = attn_53_cast_fp16, cond = var_151)[name = tensor("input_131_cast_fp16")]; tensor attn_55_cast_fp16 = softmax(axis = var_1050, x = input_131_cast_fp16)[name = tensor("attn_55_cast_fp16")]; tensor out_27_transpose_x_0 = const()[name = tensor("out_27_transpose_x_0"), val = tensor(false)]; tensor out_27_transpose_y_0 = const()[name = tensor("out_27_transpose_y_0"), val = tensor(false)]; tensor v_27_cast_fp16 = transpose(perm = v_27_perm_0, x = var_1139_cast_fp16)[name = tensor("transpose_155")]; tensor out_27_cast_fp16 = matmul(transpose_x = out_27_transpose_x_0, transpose_y = out_27_transpose_y_0, x = attn_55_cast_fp16, y = v_27_cast_fp16)[name = tensor("out_27_cast_fp16")]; tensor var_1151_perm_0 = const()[name = tensor("op_1151_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1152 = const()[name = tensor("op_1152"), val = tensor([1, 110, -1])]; tensor var_1151_cast_fp16 = transpose(perm = var_1151_perm_0, x = out_27_cast_fp16)[name = tensor("transpose_152")]; tensor input_133_cast_fp16 = reshape(shape = var_1152, x = var_1151_cast_fp16)[name = tensor("input_133_cast_fp16")]; tensor layers_6_cross_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_6_cross_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(95232576)))]; tensor linear_34_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_6_cross_attn_o_proj_weight_to_fp16, x = input_133_cast_fp16)[name = tensor("linear_34_cast_fp16")]; tensor input_135_cast_fp16 = add(x = input_129_cast_fp16, y = linear_34_cast_fp16)[name = tensor("input_135_cast_fp16")]; tensor x_65_axes_0 = const()[name = tensor("x_65_axes_0"), val = tensor([-1])]; tensor layers_6_norm_ff_weight_to_fp16 = const()[name = tensor("layers_6_norm_ff_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(95429248)))]; tensor x_65_cast_fp16 = layer_norm(axes = x_65_axes_0, epsilon = var_1057_to_fp16, gamma = layers_6_norm_ff_weight_to_fp16, x = input_135_cast_fp16)[name = tensor("x_65_cast_fp16")]; tensor input_137_perm_0 = const()[name = tensor("input_137_perm_0"), val = tensor([0, 2, 1])]; tensor input_139_pad_type_0 = const()[name = tensor("input_139_pad_type_0"), val = tensor("valid")]; tensor input_139_strides_0 = const()[name = tensor("input_139_strides_0"), val = tensor([1])]; tensor input_139_pad_0 = const()[name = tensor("input_139_pad_0"), val = tensor([0, 0])]; tensor input_139_dilations_0 = const()[name = tensor("input_139_dilations_0"), val = tensor([1])]; tensor input_139_groups_0 = const()[name = tensor("input_139_groups_0"), val = tensor(1)]; tensor layers_6_ffn_conv1_weight_to_fp16 = const()[name = tensor("layers_6_ffn_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(95430848)))]; tensor input_137_cast_fp16 = transpose(perm = input_137_perm_0, x = x_65_cast_fp16)[name = tensor("transpose_151")]; tensor input_139_cast_fp16 = conv(dilations = input_139_dilations_0, groups = input_139_groups_0, pad = input_139_pad_0, pad_type = input_139_pad_type_0, strides = input_139_strides_0, weight = layers_6_ffn_conv1_weight_to_fp16, x = input_137_cast_fp16)[name = tensor("input_139_cast_fp16")]; tensor input_141_mode_0 = const()[name = tensor("input_141_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor input_141_cast_fp16 = gelu(mode = input_141_mode_0, x = input_139_cast_fp16)[name = tensor("input_141_cast_fp16")]; tensor x_67_pad_type_0 = const()[name = tensor("x_67_pad_type_0"), val = tensor("valid")]; tensor x_67_strides_0 = const()[name = tensor("x_67_strides_0"), val = tensor([1])]; tensor x_67_pad_0 = const()[name = tensor("x_67_pad_0"), val = tensor([0, 0])]; tensor x_67_dilations_0 = const()[name = tensor("x_67_dilations_0"), val = tensor([1])]; tensor x_67_groups_0 = const()[name = tensor("x_67_groups_0"), val = tensor(1)]; tensor layers_6_ffn_conv2_weight_to_fp16 = const()[name = tensor("layers_6_ffn_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100149504)))]; tensor x_67_cast_fp16 = conv(dilations = x_67_dilations_0, groups = x_67_groups_0, pad = x_67_pad_0, pad_type = x_67_pad_type_0, strides = x_67_strides_0, weight = layers_6_ffn_conv2_weight_to_fp16, x = input_141_cast_fp16)[name = tensor("x_67_cast_fp16")]; tensor x_69_perm_0 = const()[name = tensor("x_69_perm_0"), val = tensor([0, 2, 1])]; tensor x_69_cast_fp16 = transpose(perm = x_69_perm_0, x = x_67_cast_fp16)[name = tensor("transpose_150")]; tensor input_143_cast_fp16 = add(x = input_135_cast_fp16, y = x_69_cast_fp16)[name = tensor("input_143_cast_fp16")]; tensor k_padded_13_pad_0 = const()[name = tensor("k_padded_13_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor k_padded_13_mode_0 = const()[name = tensor("k_padded_13_mode_0"), val = tensor("constant")]; tensor const_49_to_fp16 = const()[name = tensor("const_49_to_fp16"), val = tensor(0x0p+0)]; tensor k_padded_13_cast_fp16 = pad(constant_val = const_49_to_fp16, mode = k_padded_13_mode_0, pad = k_padded_13_pad_0, x = k_25_cast_fp16)[name = tensor("k_padded_13_cast_fp16")]; tensor v_padded_13_pad_0 = const()[name = tensor("v_padded_13_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor v_padded_13_mode_0 = const()[name = tensor("v_padded_13_mode_0"), val = tensor("constant")]; tensor const_50_to_fp16 = const()[name = tensor("const_50_to_fp16"), val = tensor(0x0p+0)]; tensor v_padded_13_cast_fp16 = pad(constant_val = const_50_to_fp16, mode = v_padded_13_mode_0, pad = v_padded_13_pad_0, x = v_25_cast_fp16)[name = tensor("v_padded_13_cast_fp16")]; tensor var_1204_axis_0 = const()[name = tensor("op_1204_axis_0"), val = tensor(0)]; tensor var_1204 = stack(axis = var_1204_axis_0, values = (k_padded_13_cast_fp16, v_padded_13_cast_fp16))[name = tensor("op_1204_cast_fp16")]; tensor var_1216 = const()[name = tensor("op_1216"), val = tensor(-1)]; tensor x_71_axes_0 = const()[name = tensor("x_71_axes_0"), val = tensor([-1])]; tensor layers_7_norm_sa_weight_to_fp16 = const()[name = tensor("layers_7_norm_sa_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(104868160)))]; tensor var_1223_to_fp16 = const()[name = tensor("op_1223_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_71_cast_fp16 = layer_norm(axes = x_71_axes_0, epsilon = var_1223_to_fp16, gamma = layers_7_norm_sa_weight_to_fp16, x = input_143_cast_fp16)[name = tensor("x_71_cast_fp16")]; tensor layers_7_self_attn_qkv_proj_weight_to_fp16 = const()[name = tensor("layers_7_self_attn_qkv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(104869760)))]; tensor linear_35_cast_fp16 = linear(bias = linear_0_bias_0_to_fp16, weight = layers_7_self_attn_qkv_proj_weight_to_fp16, x = x_71_cast_fp16)[name = tensor("linear_35_cast_fp16")]; tensor var_1241 = const()[name = tensor("op_1241"), val = tensor([1, 110, 3, 12, 64])]; tensor qkv_15_cast_fp16 = reshape(shape = var_1241, x = linear_35_cast_fp16)[name = tensor("qkv_15_cast_fp16")]; tensor q_43_begin_0 = const()[name = tensor("q_43_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_43_end_0 = const()[name = tensor("q_43_end_0"), val = tensor([1, 110, 1, 12, 64])]; tensor q_43_end_mask_0 = const()[name = tensor("q_43_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_43_squeeze_mask_0 = const()[name = tensor("q_43_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_43_cast_fp16 = slice_by_index(begin = q_43_begin_0, end = q_43_end_0, end_mask = q_43_end_mask_0, squeeze_mask = q_43_squeeze_mask_0, x = qkv_15_cast_fp16)[name = tensor("q_43_cast_fp16")]; tensor k_29_begin_0 = const()[name = tensor("k_29_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_29_end_0 = const()[name = tensor("k_29_end_0"), val = tensor([1, 110, 2, 12, 64])]; tensor k_29_end_mask_0 = const()[name = tensor("k_29_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_29_squeeze_mask_0 = const()[name = tensor("k_29_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_29_cast_fp16 = slice_by_index(begin = k_29_begin_0, end = k_29_end_0, end_mask = k_29_end_mask_0, squeeze_mask = k_29_squeeze_mask_0, x = qkv_15_cast_fp16)[name = tensor("k_29_cast_fp16")]; tensor v_29_begin_0 = const()[name = tensor("v_29_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_29_end_0 = const()[name = tensor("v_29_end_0"), val = tensor([1, 110, 3, 12, 64])]; tensor v_29_end_mask_0 = const()[name = tensor("v_29_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_29_squeeze_mask_0 = const()[name = tensor("v_29_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_29_cast_fp16 = slice_by_index(begin = v_29_begin_0, end = v_29_end_0, end_mask = v_29_end_mask_0, squeeze_mask = v_29_squeeze_mask_0, x = qkv_15_cast_fp16)[name = tensor("v_29_cast_fp16")]; tensor v_t_15_perm_0 = const()[name = tensor("v_t_15_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1256_transpose_x_0 = const()[name = tensor("op_1256_transpose_x_0"), val = tensor(false)]; tensor var_1256_transpose_y_0 = const()[name = tensor("op_1256_transpose_y_0"), val = tensor(false)]; tensor transpose_94_perm_0 = const()[name = tensor("transpose_94_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_95_perm_0 = const()[name = tensor("transpose_95_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_95 = transpose(perm = transpose_95_perm_0, x = k_29_cast_fp16)[name = tensor("transpose_147")]; tensor transpose_94 = transpose(perm = transpose_94_perm_0, x = q_43_cast_fp16)[name = tensor("transpose_148")]; tensor var_1256_cast_fp16 = matmul(transpose_x = var_1256_transpose_x_0, transpose_y = var_1256_transpose_y_0, x = transpose_94, y = transpose_95)[name = tensor("op_1256_cast_fp16")]; tensor var_1257_to_fp16 = const()[name = tensor("op_1257_to_fp16"), val = tensor(0x1p-3)]; tensor attn_57_cast_fp16 = mul(x = var_1256_cast_fp16, y = var_1257_to_fp16)[name = tensor("attn_57_cast_fp16")]; tensor attn_57_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("attn_57_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor attn_57_cast_fp16_to_fp32 = cast(dtype = attn_57_cast_fp16_to_fp32_dtype_0, x = attn_57_cast_fp16)[name = tensor("cast_79")]; tensor input_145 = add(x = attn_57_cast_fp16_to_fp32, y = var_102)[name = tensor("input_145")]; tensor input_145_to_fp16_dtype_0 = const()[name = tensor("input_145_to_fp16_dtype_0"), val = tensor("fp16")]; tensor input_145_to_fp16 = cast(dtype = input_145_to_fp16_dtype_0, x = input_145)[name = tensor("cast_78")]; tensor attn_59_cast_fp16 = softmax(axis = var_1216, x = input_145_to_fp16)[name = tensor("attn_59_cast_fp16")]; tensor out_29_transpose_x_0 = const()[name = tensor("out_29_transpose_x_0"), val = tensor(false)]; tensor out_29_transpose_y_0 = const()[name = tensor("out_29_transpose_y_0"), val = tensor(false)]; tensor v_t_15_cast_fp16 = transpose(perm = v_t_15_perm_0, x = v_29_cast_fp16)[name = tensor("transpose_149")]; tensor out_29_cast_fp16 = matmul(transpose_x = out_29_transpose_x_0, transpose_y = out_29_transpose_y_0, x = attn_59_cast_fp16, y = v_t_15_cast_fp16)[name = tensor("out_29_cast_fp16")]; tensor var_1268_perm_0 = const()[name = tensor("op_1268_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1269 = const()[name = tensor("op_1269"), val = tensor([1, 110, -1])]; tensor var_1268_cast_fp16 = transpose(perm = var_1268_perm_0, x = out_29_cast_fp16)[name = tensor("transpose_146")]; tensor input_147_cast_fp16 = reshape(shape = var_1269, x = var_1268_cast_fp16)[name = tensor("input_147_cast_fp16")]; tensor layers_7_self_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_7_self_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(108408768)))]; tensor linear_36_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_7_self_attn_o_proj_weight_to_fp16, x = input_147_cast_fp16)[name = tensor("linear_36_cast_fp16")]; tensor input_149_cast_fp16 = add(x = input_143_cast_fp16, y = linear_36_cast_fp16)[name = tensor("input_149_cast_fp16")]; tensor x_73_axes_0 = const()[name = tensor("x_73_axes_0"), val = tensor([-1])]; tensor layers_7_norm_xa_query_weight_to_fp16 = const()[name = tensor("layers_7_norm_xa_query_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(109588480)))]; tensor x_73_cast_fp16 = layer_norm(axes = x_73_axes_0, epsilon = var_1223_to_fp16, gamma = layers_7_norm_xa_query_weight_to_fp16, x = input_149_cast_fp16)[name = tensor("x_73_cast_fp16")]; tensor memory_15_axes_0 = const()[name = tensor("memory_15_axes_0"), val = tensor([-1])]; tensor layers_7_norm_xa_memory_weight_to_fp16 = const()[name = tensor("layers_7_norm_xa_memory_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(109590080)))]; tensor memory_15_cast_fp16 = layer_norm(axes = memory_15_axes_0, epsilon = var_1223_to_fp16, gamma = layers_7_norm_xa_memory_weight_to_fp16, x = encoder_output)[name = tensor("memory_15_cast_fp16")]; tensor layers_7_cross_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_7_cross_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(109591680)))]; tensor linear_37_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = layers_7_cross_attn_q_proj_weight_to_fp16, x = x_73_cast_fp16)[name = tensor("linear_37_cast_fp16")]; tensor var_1292 = const()[name = tensor("op_1292"), val = tensor([1, 110, 1, 128])]; tensor var_1293_cast_fp16 = reshape(shape = var_1292, x = linear_37_cast_fp16)[name = tensor("op_1293_cast_fp16")]; tensor layers_7_cross_attn_kv_proj_weight_to_fp16 = const()[name = tensor("layers_7_cross_attn_kv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(109788352)))]; tensor linear_38_cast_fp16 = linear(bias = linear_3_bias_0_to_fp16, weight = layers_7_cross_attn_kv_proj_weight_to_fp16, x = memory_15_cast_fp16)[name = tensor("linear_38_cast_fp16")]; tensor var_1297 = const()[name = tensor("op_1297"), val = tensor([1, 256, 2, 1, 128])]; tensor kv_15_cast_fp16 = reshape(shape = var_1297, x = linear_38_cast_fp16)[name = tensor("kv_15_cast_fp16")]; tensor var_1301_begin_0 = const()[name = tensor("op_1301_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_1301_end_0 = const()[name = tensor("op_1301_end_0"), val = tensor([1, 256, 1, 1, 128])]; tensor var_1301_end_mask_0 = const()[name = tensor("op_1301_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_1301_squeeze_mask_0 = const()[name = tensor("op_1301_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_1301_cast_fp16 = slice_by_index(begin = var_1301_begin_0, end = var_1301_end_0, end_mask = var_1301_end_mask_0, squeeze_mask = var_1301_squeeze_mask_0, x = kv_15_cast_fp16)[name = tensor("op_1301_cast_fp16")]; tensor var_1305_begin_0 = const()[name = tensor("op_1305_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor var_1305_end_0 = const()[name = tensor("op_1305_end_0"), val = tensor([1, 256, 2, 1, 128])]; tensor var_1305_end_mask_0 = const()[name = tensor("op_1305_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_1305_squeeze_mask_0 = const()[name = tensor("op_1305_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_1305_cast_fp16 = slice_by_index(begin = var_1305_begin_0, end = var_1305_end_0, end_mask = var_1305_end_mask_0, squeeze_mask = var_1305_squeeze_mask_0, x = kv_15_cast_fp16)[name = tensor("op_1305_cast_fp16")]; tensor v_31_perm_0 = const()[name = tensor("v_31_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1308_transpose_x_0 = const()[name = tensor("op_1308_transpose_x_0"), val = tensor(false)]; tensor var_1308_transpose_y_0 = const()[name = tensor("op_1308_transpose_y_0"), val = tensor(false)]; tensor transpose_96_perm_0 = const()[name = tensor("transpose_96_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_97_perm_0 = const()[name = tensor("transpose_97_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_97 = transpose(perm = transpose_97_perm_0, x = var_1301_cast_fp16)[name = tensor("transpose_143")]; tensor transpose_96 = transpose(perm = transpose_96_perm_0, x = var_1293_cast_fp16)[name = tensor("transpose_144")]; tensor var_1308_cast_fp16 = matmul(transpose_x = var_1308_transpose_x_0, transpose_y = var_1308_transpose_y_0, x = transpose_96, y = transpose_97)[name = tensor("op_1308_cast_fp16")]; tensor var_1309_to_fp16 = const()[name = tensor("op_1309_to_fp16"), val = tensor(0x1.6ap-4)]; tensor attn_61_cast_fp16 = mul(x = var_1308_cast_fp16, y = var_1309_to_fp16)[name = tensor("attn_61_cast_fp16")]; tensor var_1207_to_fp16 = const()[name = tensor("op_1207_to_fp16"), val = tensor(-inf)]; tensor input_151_cast_fp16 = select(a = var_1207_to_fp16, b = attn_61_cast_fp16, cond = var_151)[name = tensor("input_151_cast_fp16")]; tensor attn_63_cast_fp16 = softmax(axis = var_1216, x = input_151_cast_fp16)[name = tensor("attn_63_cast_fp16")]; tensor out_31_transpose_x_0 = const()[name = tensor("out_31_transpose_x_0"), val = tensor(false)]; tensor out_31_transpose_y_0 = const()[name = tensor("out_31_transpose_y_0"), val = tensor(false)]; tensor v_31_cast_fp16 = transpose(perm = v_31_perm_0, x = var_1305_cast_fp16)[name = tensor("transpose_145")]; tensor out_31_cast_fp16 = matmul(transpose_x = out_31_transpose_x_0, transpose_y = out_31_transpose_y_0, x = attn_63_cast_fp16, y = v_31_cast_fp16)[name = tensor("out_31_cast_fp16")]; tensor var_1317_perm_0 = const()[name = tensor("op_1317_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1318 = const()[name = tensor("op_1318"), val = tensor([1, 110, -1])]; tensor var_1317_cast_fp16 = transpose(perm = var_1317_perm_0, x = out_31_cast_fp16)[name = tensor("transpose_142")]; tensor input_153_cast_fp16 = reshape(shape = var_1318, x = var_1317_cast_fp16)[name = tensor("input_153_cast_fp16")]; tensor layers_7_cross_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_7_cross_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110181632)))]; tensor linear_39_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_7_cross_attn_o_proj_weight_to_fp16, x = input_153_cast_fp16)[name = tensor("linear_39_cast_fp16")]; tensor input_155_cast_fp16 = add(x = input_149_cast_fp16, y = linear_39_cast_fp16)[name = tensor("input_155_cast_fp16")]; tensor x_75_axes_0 = const()[name = tensor("x_75_axes_0"), val = tensor([-1])]; tensor layers_7_norm_ff_weight_to_fp16 = const()[name = tensor("layers_7_norm_ff_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110378304)))]; tensor x_75_cast_fp16 = layer_norm(axes = x_75_axes_0, epsilon = var_1223_to_fp16, gamma = layers_7_norm_ff_weight_to_fp16, x = input_155_cast_fp16)[name = tensor("x_75_cast_fp16")]; tensor input_157_perm_0 = const()[name = tensor("input_157_perm_0"), val = tensor([0, 2, 1])]; tensor input_159_pad_type_0 = const()[name = tensor("input_159_pad_type_0"), val = tensor("valid")]; tensor input_159_strides_0 = const()[name = tensor("input_159_strides_0"), val = tensor([1])]; tensor input_159_pad_0 = const()[name = tensor("input_159_pad_0"), val = tensor([0, 0])]; tensor input_159_dilations_0 = const()[name = tensor("input_159_dilations_0"), val = tensor([1])]; tensor input_159_groups_0 = const()[name = tensor("input_159_groups_0"), val = tensor(1)]; tensor layers_7_ffn_conv1_weight_to_fp16 = const()[name = tensor("layers_7_ffn_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110379904)))]; tensor input_157_cast_fp16 = transpose(perm = input_157_perm_0, x = x_75_cast_fp16)[name = tensor("transpose_141")]; tensor input_159_cast_fp16 = conv(dilations = input_159_dilations_0, groups = input_159_groups_0, pad = input_159_pad_0, pad_type = input_159_pad_type_0, strides = input_159_strides_0, weight = layers_7_ffn_conv1_weight_to_fp16, x = input_157_cast_fp16)[name = tensor("input_159_cast_fp16")]; tensor input_161_mode_0 = const()[name = tensor("input_161_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor input_161_cast_fp16 = gelu(mode = input_161_mode_0, x = input_159_cast_fp16)[name = tensor("input_161_cast_fp16")]; tensor x_77_pad_type_0 = const()[name = tensor("x_77_pad_type_0"), val = tensor("valid")]; tensor x_77_strides_0 = const()[name = tensor("x_77_strides_0"), val = tensor([1])]; tensor x_77_pad_0 = const()[name = tensor("x_77_pad_0"), val = tensor([0, 0])]; tensor x_77_dilations_0 = const()[name = tensor("x_77_dilations_0"), val = tensor([1])]; tensor x_77_groups_0 = const()[name = tensor("x_77_groups_0"), val = tensor(1)]; tensor layers_7_ffn_conv2_weight_to_fp16 = const()[name = tensor("layers_7_ffn_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(115098560)))]; tensor x_77_cast_fp16 = conv(dilations = x_77_dilations_0, groups = x_77_groups_0, pad = x_77_pad_0, pad_type = x_77_pad_type_0, strides = x_77_strides_0, weight = layers_7_ffn_conv2_weight_to_fp16, x = input_161_cast_fp16)[name = tensor("x_77_cast_fp16")]; tensor x_79_perm_0 = const()[name = tensor("x_79_perm_0"), val = tensor([0, 2, 1])]; tensor x_79_cast_fp16 = transpose(perm = x_79_perm_0, x = x_77_cast_fp16)[name = tensor("transpose_140")]; tensor input_163_cast_fp16 = add(x = input_155_cast_fp16, y = x_79_cast_fp16)[name = tensor("input_163_cast_fp16")]; tensor k_padded_15_pad_0 = const()[name = tensor("k_padded_15_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor k_padded_15_mode_0 = const()[name = tensor("k_padded_15_mode_0"), val = tensor("constant")]; tensor const_56_to_fp16 = const()[name = tensor("const_56_to_fp16"), val = tensor(0x0p+0)]; tensor k_padded_15_cast_fp16 = pad(constant_val = const_56_to_fp16, mode = k_padded_15_mode_0, pad = k_padded_15_pad_0, x = k_29_cast_fp16)[name = tensor("k_padded_15_cast_fp16")]; tensor v_padded_15_pad_0 = const()[name = tensor("v_padded_15_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor v_padded_15_mode_0 = const()[name = tensor("v_padded_15_mode_0"), val = tensor("constant")]; tensor const_57_to_fp16 = const()[name = tensor("const_57_to_fp16"), val = tensor(0x0p+0)]; tensor v_padded_15_cast_fp16 = pad(constant_val = const_57_to_fp16, mode = v_padded_15_mode_0, pad = v_padded_15_pad_0, x = v_29_cast_fp16)[name = tensor("v_padded_15_cast_fp16")]; tensor var_1370_axis_0 = const()[name = tensor("op_1370_axis_0"), val = tensor(0)]; tensor var_1370 = stack(axis = var_1370_axis_0, values = (k_padded_15_cast_fp16, v_padded_15_cast_fp16))[name = tensor("op_1370_cast_fp16")]; tensor var_1382 = const()[name = tensor("op_1382"), val = tensor(-1)]; tensor x_81_axes_0 = const()[name = tensor("x_81_axes_0"), val = tensor([-1])]; tensor layers_8_norm_sa_weight_to_fp16 = const()[name = tensor("layers_8_norm_sa_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119817216)))]; tensor var_1389_to_fp16 = const()[name = tensor("op_1389_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_81_cast_fp16 = layer_norm(axes = x_81_axes_0, epsilon = var_1389_to_fp16, gamma = layers_8_norm_sa_weight_to_fp16, x = input_163_cast_fp16)[name = tensor("x_81_cast_fp16")]; tensor layers_8_self_attn_qkv_proj_weight_to_fp16 = const()[name = tensor("layers_8_self_attn_qkv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119818816)))]; tensor linear_40_cast_fp16 = linear(bias = linear_0_bias_0_to_fp16, weight = layers_8_self_attn_qkv_proj_weight_to_fp16, x = x_81_cast_fp16)[name = tensor("linear_40_cast_fp16")]; tensor var_1407 = const()[name = tensor("op_1407"), val = tensor([1, 110, 3, 12, 64])]; tensor qkv_17_cast_fp16 = reshape(shape = var_1407, x = linear_40_cast_fp16)[name = tensor("qkv_17_cast_fp16")]; tensor q_49_begin_0 = const()[name = tensor("q_49_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_49_end_0 = const()[name = tensor("q_49_end_0"), val = tensor([1, 110, 1, 12, 64])]; tensor q_49_end_mask_0 = const()[name = tensor("q_49_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_49_squeeze_mask_0 = const()[name = tensor("q_49_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_49_cast_fp16 = slice_by_index(begin = q_49_begin_0, end = q_49_end_0, end_mask = q_49_end_mask_0, squeeze_mask = q_49_squeeze_mask_0, x = qkv_17_cast_fp16)[name = tensor("q_49_cast_fp16")]; tensor k_33_begin_0 = const()[name = tensor("k_33_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_33_end_0 = const()[name = tensor("k_33_end_0"), val = tensor([1, 110, 2, 12, 64])]; tensor k_33_end_mask_0 = const()[name = tensor("k_33_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_33_squeeze_mask_0 = const()[name = tensor("k_33_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_33_cast_fp16 = slice_by_index(begin = k_33_begin_0, end = k_33_end_0, end_mask = k_33_end_mask_0, squeeze_mask = k_33_squeeze_mask_0, x = qkv_17_cast_fp16)[name = tensor("k_33_cast_fp16")]; tensor v_33_begin_0 = const()[name = tensor("v_33_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_33_end_0 = const()[name = tensor("v_33_end_0"), val = tensor([1, 110, 3, 12, 64])]; tensor v_33_end_mask_0 = const()[name = tensor("v_33_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_33_squeeze_mask_0 = const()[name = tensor("v_33_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_33_cast_fp16 = slice_by_index(begin = v_33_begin_0, end = v_33_end_0, end_mask = v_33_end_mask_0, squeeze_mask = v_33_squeeze_mask_0, x = qkv_17_cast_fp16)[name = tensor("v_33_cast_fp16")]; tensor v_t_17_perm_0 = const()[name = tensor("v_t_17_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1422_transpose_x_0 = const()[name = tensor("op_1422_transpose_x_0"), val = tensor(false)]; tensor var_1422_transpose_y_0 = const()[name = tensor("op_1422_transpose_y_0"), val = tensor(false)]; tensor transpose_98_perm_0 = const()[name = tensor("transpose_98_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_99_perm_0 = const()[name = tensor("transpose_99_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_99 = transpose(perm = transpose_99_perm_0, x = k_33_cast_fp16)[name = tensor("transpose_137")]; tensor transpose_98 = transpose(perm = transpose_98_perm_0, x = q_49_cast_fp16)[name = tensor("transpose_138")]; tensor var_1422_cast_fp16 = matmul(transpose_x = var_1422_transpose_x_0, transpose_y = var_1422_transpose_y_0, x = transpose_98, y = transpose_99)[name = tensor("op_1422_cast_fp16")]; tensor var_1423_to_fp16 = const()[name = tensor("op_1423_to_fp16"), val = tensor(0x1p-3)]; tensor attn_65_cast_fp16 = mul(x = var_1422_cast_fp16, y = var_1423_to_fp16)[name = tensor("attn_65_cast_fp16")]; tensor attn_65_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("attn_65_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor attn_65_cast_fp16_to_fp32 = cast(dtype = attn_65_cast_fp16_to_fp32_dtype_0, x = attn_65_cast_fp16)[name = tensor("cast_77")]; tensor input_165 = add(x = attn_65_cast_fp16_to_fp32, y = var_102)[name = tensor("input_165")]; tensor input_165_to_fp16_dtype_0 = const()[name = tensor("input_165_to_fp16_dtype_0"), val = tensor("fp16")]; tensor input_165_to_fp16 = cast(dtype = input_165_to_fp16_dtype_0, x = input_165)[name = tensor("cast_76")]; tensor attn_67_cast_fp16 = softmax(axis = var_1382, x = input_165_to_fp16)[name = tensor("attn_67_cast_fp16")]; tensor out_33_transpose_x_0 = const()[name = tensor("out_33_transpose_x_0"), val = tensor(false)]; tensor out_33_transpose_y_0 = const()[name = tensor("out_33_transpose_y_0"), val = tensor(false)]; tensor v_t_17_cast_fp16 = transpose(perm = v_t_17_perm_0, x = v_33_cast_fp16)[name = tensor("transpose_139")]; tensor out_33_cast_fp16 = matmul(transpose_x = out_33_transpose_x_0, transpose_y = out_33_transpose_y_0, x = attn_67_cast_fp16, y = v_t_17_cast_fp16)[name = tensor("out_33_cast_fp16")]; tensor var_1434_perm_0 = const()[name = tensor("op_1434_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1435 = const()[name = tensor("op_1435"), val = tensor([1, 110, -1])]; tensor var_1434_cast_fp16 = transpose(perm = var_1434_perm_0, x = out_33_cast_fp16)[name = tensor("transpose_136")]; tensor input_167_cast_fp16 = reshape(shape = var_1435, x = var_1434_cast_fp16)[name = tensor("input_167_cast_fp16")]; tensor layers_8_self_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_8_self_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(123357824)))]; tensor linear_41_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_8_self_attn_o_proj_weight_to_fp16, x = input_167_cast_fp16)[name = tensor("linear_41_cast_fp16")]; tensor input_169_cast_fp16 = add(x = input_163_cast_fp16, y = linear_41_cast_fp16)[name = tensor("input_169_cast_fp16")]; tensor x_83_axes_0 = const()[name = tensor("x_83_axes_0"), val = tensor([-1])]; tensor layers_8_norm_xa_query_weight_to_fp16 = const()[name = tensor("layers_8_norm_xa_query_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(124537536)))]; tensor x_83_cast_fp16 = layer_norm(axes = x_83_axes_0, epsilon = var_1389_to_fp16, gamma = layers_8_norm_xa_query_weight_to_fp16, x = input_169_cast_fp16)[name = tensor("x_83_cast_fp16")]; tensor memory_17_axes_0 = const()[name = tensor("memory_17_axes_0"), val = tensor([-1])]; tensor layers_8_norm_xa_memory_weight_to_fp16 = const()[name = tensor("layers_8_norm_xa_memory_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(124539136)))]; tensor memory_17_cast_fp16 = layer_norm(axes = memory_17_axes_0, epsilon = var_1389_to_fp16, gamma = layers_8_norm_xa_memory_weight_to_fp16, x = encoder_output)[name = tensor("memory_17_cast_fp16")]; tensor layers_8_cross_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_8_cross_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(124540736)))]; tensor linear_42_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = layers_8_cross_attn_q_proj_weight_to_fp16, x = x_83_cast_fp16)[name = tensor("linear_42_cast_fp16")]; tensor var_1458 = const()[name = tensor("op_1458"), val = tensor([1, 110, 1, 128])]; tensor var_1459_cast_fp16 = reshape(shape = var_1458, x = linear_42_cast_fp16)[name = tensor("op_1459_cast_fp16")]; tensor layers_8_cross_attn_kv_proj_weight_to_fp16 = const()[name = tensor("layers_8_cross_attn_kv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(124737408)))]; tensor linear_43_cast_fp16 = linear(bias = linear_3_bias_0_to_fp16, weight = layers_8_cross_attn_kv_proj_weight_to_fp16, x = memory_17_cast_fp16)[name = tensor("linear_43_cast_fp16")]; tensor var_1463 = const()[name = tensor("op_1463"), val = tensor([1, 256, 2, 1, 128])]; tensor kv_17_cast_fp16 = reshape(shape = var_1463, x = linear_43_cast_fp16)[name = tensor("kv_17_cast_fp16")]; tensor var_1467_begin_0 = const()[name = tensor("op_1467_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_1467_end_0 = const()[name = tensor("op_1467_end_0"), val = tensor([1, 256, 1, 1, 128])]; tensor var_1467_end_mask_0 = const()[name = tensor("op_1467_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_1467_squeeze_mask_0 = const()[name = tensor("op_1467_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_1467_cast_fp16 = slice_by_index(begin = var_1467_begin_0, end = var_1467_end_0, end_mask = var_1467_end_mask_0, squeeze_mask = var_1467_squeeze_mask_0, x = kv_17_cast_fp16)[name = tensor("op_1467_cast_fp16")]; tensor var_1471_begin_0 = const()[name = tensor("op_1471_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor var_1471_end_0 = const()[name = tensor("op_1471_end_0"), val = tensor([1, 256, 2, 1, 128])]; tensor var_1471_end_mask_0 = const()[name = tensor("op_1471_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_1471_squeeze_mask_0 = const()[name = tensor("op_1471_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_1471_cast_fp16 = slice_by_index(begin = var_1471_begin_0, end = var_1471_end_0, end_mask = var_1471_end_mask_0, squeeze_mask = var_1471_squeeze_mask_0, x = kv_17_cast_fp16)[name = tensor("op_1471_cast_fp16")]; tensor v_35_perm_0 = const()[name = tensor("v_35_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1474_transpose_x_0 = const()[name = tensor("op_1474_transpose_x_0"), val = tensor(false)]; tensor var_1474_transpose_y_0 = const()[name = tensor("op_1474_transpose_y_0"), val = tensor(false)]; tensor transpose_100_perm_0 = const()[name = tensor("transpose_100_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_101_perm_0 = const()[name = tensor("transpose_101_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_101 = transpose(perm = transpose_101_perm_0, x = var_1467_cast_fp16)[name = tensor("transpose_133")]; tensor transpose_100 = transpose(perm = transpose_100_perm_0, x = var_1459_cast_fp16)[name = tensor("transpose_134")]; tensor var_1474_cast_fp16 = matmul(transpose_x = var_1474_transpose_x_0, transpose_y = var_1474_transpose_y_0, x = transpose_100, y = transpose_101)[name = tensor("op_1474_cast_fp16")]; tensor var_1475_to_fp16 = const()[name = tensor("op_1475_to_fp16"), val = tensor(0x1.6ap-4)]; tensor attn_69_cast_fp16 = mul(x = var_1474_cast_fp16, y = var_1475_to_fp16)[name = tensor("attn_69_cast_fp16")]; tensor var_1373_to_fp16 = const()[name = tensor("op_1373_to_fp16"), val = tensor(-inf)]; tensor input_171_cast_fp16 = select(a = var_1373_to_fp16, b = attn_69_cast_fp16, cond = var_151)[name = tensor("input_171_cast_fp16")]; tensor attn_71_cast_fp16 = softmax(axis = var_1382, x = input_171_cast_fp16)[name = tensor("attn_71_cast_fp16")]; tensor out_35_transpose_x_0 = const()[name = tensor("out_35_transpose_x_0"), val = tensor(false)]; tensor out_35_transpose_y_0 = const()[name = tensor("out_35_transpose_y_0"), val = tensor(false)]; tensor v_35_cast_fp16 = transpose(perm = v_35_perm_0, x = var_1471_cast_fp16)[name = tensor("transpose_135")]; tensor out_35_cast_fp16 = matmul(transpose_x = out_35_transpose_x_0, transpose_y = out_35_transpose_y_0, x = attn_71_cast_fp16, y = v_35_cast_fp16)[name = tensor("out_35_cast_fp16")]; tensor var_1483_perm_0 = const()[name = tensor("op_1483_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1484 = const()[name = tensor("op_1484"), val = tensor([1, 110, -1])]; tensor var_1483_cast_fp16 = transpose(perm = var_1483_perm_0, x = out_35_cast_fp16)[name = tensor("transpose_132")]; tensor input_173_cast_fp16 = reshape(shape = var_1484, x = var_1483_cast_fp16)[name = tensor("input_173_cast_fp16")]; tensor layers_8_cross_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_8_cross_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(125130688)))]; tensor linear_44_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_8_cross_attn_o_proj_weight_to_fp16, x = input_173_cast_fp16)[name = tensor("linear_44_cast_fp16")]; tensor input_175_cast_fp16 = add(x = input_169_cast_fp16, y = linear_44_cast_fp16)[name = tensor("input_175_cast_fp16")]; tensor x_85_axes_0 = const()[name = tensor("x_85_axes_0"), val = tensor([-1])]; tensor layers_8_norm_ff_weight_to_fp16 = const()[name = tensor("layers_8_norm_ff_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(125327360)))]; tensor x_85_cast_fp16 = layer_norm(axes = x_85_axes_0, epsilon = var_1389_to_fp16, gamma = layers_8_norm_ff_weight_to_fp16, x = input_175_cast_fp16)[name = tensor("x_85_cast_fp16")]; tensor input_177_perm_0 = const()[name = tensor("input_177_perm_0"), val = tensor([0, 2, 1])]; tensor input_179_pad_type_0 = const()[name = tensor("input_179_pad_type_0"), val = tensor("valid")]; tensor input_179_strides_0 = const()[name = tensor("input_179_strides_0"), val = tensor([1])]; tensor input_179_pad_0 = const()[name = tensor("input_179_pad_0"), val = tensor([0, 0])]; tensor input_179_dilations_0 = const()[name = tensor("input_179_dilations_0"), val = tensor([1])]; tensor input_179_groups_0 = const()[name = tensor("input_179_groups_0"), val = tensor(1)]; tensor layers_8_ffn_conv1_weight_to_fp16 = const()[name = tensor("layers_8_ffn_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(125328960)))]; tensor input_177_cast_fp16 = transpose(perm = input_177_perm_0, x = x_85_cast_fp16)[name = tensor("transpose_131")]; tensor input_179_cast_fp16 = conv(dilations = input_179_dilations_0, groups = input_179_groups_0, pad = input_179_pad_0, pad_type = input_179_pad_type_0, strides = input_179_strides_0, weight = layers_8_ffn_conv1_weight_to_fp16, x = input_177_cast_fp16)[name = tensor("input_179_cast_fp16")]; tensor input_181_mode_0 = const()[name = tensor("input_181_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor input_181_cast_fp16 = gelu(mode = input_181_mode_0, x = input_179_cast_fp16)[name = tensor("input_181_cast_fp16")]; tensor x_87_pad_type_0 = const()[name = tensor("x_87_pad_type_0"), val = tensor("valid")]; tensor x_87_strides_0 = const()[name = tensor("x_87_strides_0"), val = tensor([1])]; tensor x_87_pad_0 = const()[name = tensor("x_87_pad_0"), val = tensor([0, 0])]; tensor x_87_dilations_0 = const()[name = tensor("x_87_dilations_0"), val = tensor([1])]; tensor x_87_groups_0 = const()[name = tensor("x_87_groups_0"), val = tensor(1)]; tensor layers_8_ffn_conv2_weight_to_fp16 = const()[name = tensor("layers_8_ffn_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(130047616)))]; tensor x_87_cast_fp16 = conv(dilations = x_87_dilations_0, groups = x_87_groups_0, pad = x_87_pad_0, pad_type = x_87_pad_type_0, strides = x_87_strides_0, weight = layers_8_ffn_conv2_weight_to_fp16, x = input_181_cast_fp16)[name = tensor("x_87_cast_fp16")]; tensor x_89_perm_0 = const()[name = tensor("x_89_perm_0"), val = tensor([0, 2, 1])]; tensor x_89_cast_fp16 = transpose(perm = x_89_perm_0, x = x_87_cast_fp16)[name = tensor("transpose_130")]; tensor input_183_cast_fp16 = add(x = input_175_cast_fp16, y = x_89_cast_fp16)[name = tensor("input_183_cast_fp16")]; tensor k_padded_17_pad_0 = const()[name = tensor("k_padded_17_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor k_padded_17_mode_0 = const()[name = tensor("k_padded_17_mode_0"), val = tensor("constant")]; tensor const_63_to_fp16 = const()[name = tensor("const_63_to_fp16"), val = tensor(0x0p+0)]; tensor k_padded_17_cast_fp16 = pad(constant_val = const_63_to_fp16, mode = k_padded_17_mode_0, pad = k_padded_17_pad_0, x = k_33_cast_fp16)[name = tensor("k_padded_17_cast_fp16")]; tensor v_padded_17_pad_0 = const()[name = tensor("v_padded_17_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor v_padded_17_mode_0 = const()[name = tensor("v_padded_17_mode_0"), val = tensor("constant")]; tensor const_64_to_fp16 = const()[name = tensor("const_64_to_fp16"), val = tensor(0x0p+0)]; tensor v_padded_17_cast_fp16 = pad(constant_val = const_64_to_fp16, mode = v_padded_17_mode_0, pad = v_padded_17_pad_0, x = v_33_cast_fp16)[name = tensor("v_padded_17_cast_fp16")]; tensor var_1536_axis_0 = const()[name = tensor("op_1536_axis_0"), val = tensor(0)]; tensor var_1536 = stack(axis = var_1536_axis_0, values = (k_padded_17_cast_fp16, v_padded_17_cast_fp16))[name = tensor("op_1536_cast_fp16")]; tensor var_1548 = const()[name = tensor("op_1548"), val = tensor(-1)]; tensor x_91_axes_0 = const()[name = tensor("x_91_axes_0"), val = tensor([-1])]; tensor layers_9_norm_sa_weight_to_fp16 = const()[name = tensor("layers_9_norm_sa_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(134766272)))]; tensor var_1555_to_fp16 = const()[name = tensor("op_1555_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_91_cast_fp16 = layer_norm(axes = x_91_axes_0, epsilon = var_1555_to_fp16, gamma = layers_9_norm_sa_weight_to_fp16, x = input_183_cast_fp16)[name = tensor("x_91_cast_fp16")]; tensor layers_9_self_attn_qkv_proj_weight_to_fp16 = const()[name = tensor("layers_9_self_attn_qkv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(134767872)))]; tensor linear_45_cast_fp16 = linear(bias = linear_0_bias_0_to_fp16, weight = layers_9_self_attn_qkv_proj_weight_to_fp16, x = x_91_cast_fp16)[name = tensor("linear_45_cast_fp16")]; tensor var_1573 = const()[name = tensor("op_1573"), val = tensor([1, 110, 3, 12, 64])]; tensor qkv_19_cast_fp16 = reshape(shape = var_1573, x = linear_45_cast_fp16)[name = tensor("qkv_19_cast_fp16")]; tensor q_55_begin_0 = const()[name = tensor("q_55_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_55_end_0 = const()[name = tensor("q_55_end_0"), val = tensor([1, 110, 1, 12, 64])]; tensor q_55_end_mask_0 = const()[name = tensor("q_55_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_55_squeeze_mask_0 = const()[name = tensor("q_55_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_55_cast_fp16 = slice_by_index(begin = q_55_begin_0, end = q_55_end_0, end_mask = q_55_end_mask_0, squeeze_mask = q_55_squeeze_mask_0, x = qkv_19_cast_fp16)[name = tensor("q_55_cast_fp16")]; tensor k_37_begin_0 = const()[name = tensor("k_37_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_37_end_0 = const()[name = tensor("k_37_end_0"), val = tensor([1, 110, 2, 12, 64])]; tensor k_37_end_mask_0 = const()[name = tensor("k_37_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_37_squeeze_mask_0 = const()[name = tensor("k_37_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_37_cast_fp16 = slice_by_index(begin = k_37_begin_0, end = k_37_end_0, end_mask = k_37_end_mask_0, squeeze_mask = k_37_squeeze_mask_0, x = qkv_19_cast_fp16)[name = tensor("k_37_cast_fp16")]; tensor v_37_begin_0 = const()[name = tensor("v_37_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_37_end_0 = const()[name = tensor("v_37_end_0"), val = tensor([1, 110, 3, 12, 64])]; tensor v_37_end_mask_0 = const()[name = tensor("v_37_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_37_squeeze_mask_0 = const()[name = tensor("v_37_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_37_cast_fp16 = slice_by_index(begin = v_37_begin_0, end = v_37_end_0, end_mask = v_37_end_mask_0, squeeze_mask = v_37_squeeze_mask_0, x = qkv_19_cast_fp16)[name = tensor("v_37_cast_fp16")]; tensor v_t_19_perm_0 = const()[name = tensor("v_t_19_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1588_transpose_x_0 = const()[name = tensor("op_1588_transpose_x_0"), val = tensor(false)]; tensor var_1588_transpose_y_0 = const()[name = tensor("op_1588_transpose_y_0"), val = tensor(false)]; tensor transpose_102_perm_0 = const()[name = tensor("transpose_102_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_103_perm_0 = const()[name = tensor("transpose_103_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_103 = transpose(perm = transpose_103_perm_0, x = k_37_cast_fp16)[name = tensor("transpose_127")]; tensor transpose_102 = transpose(perm = transpose_102_perm_0, x = q_55_cast_fp16)[name = tensor("transpose_128")]; tensor var_1588_cast_fp16 = matmul(transpose_x = var_1588_transpose_x_0, transpose_y = var_1588_transpose_y_0, x = transpose_102, y = transpose_103)[name = tensor("op_1588_cast_fp16")]; tensor var_1589_to_fp16 = const()[name = tensor("op_1589_to_fp16"), val = tensor(0x1p-3)]; tensor attn_73_cast_fp16 = mul(x = var_1588_cast_fp16, y = var_1589_to_fp16)[name = tensor("attn_73_cast_fp16")]; tensor attn_73_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("attn_73_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor attn_73_cast_fp16_to_fp32 = cast(dtype = attn_73_cast_fp16_to_fp32_dtype_0, x = attn_73_cast_fp16)[name = tensor("cast_75")]; tensor input_185 = add(x = attn_73_cast_fp16_to_fp32, y = var_102)[name = tensor("input_185")]; tensor input_185_to_fp16_dtype_0 = const()[name = tensor("input_185_to_fp16_dtype_0"), val = tensor("fp16")]; tensor input_185_to_fp16 = cast(dtype = input_185_to_fp16_dtype_0, x = input_185)[name = tensor("cast_74")]; tensor attn_75_cast_fp16 = softmax(axis = var_1548, x = input_185_to_fp16)[name = tensor("attn_75_cast_fp16")]; tensor out_37_transpose_x_0 = const()[name = tensor("out_37_transpose_x_0"), val = tensor(false)]; tensor out_37_transpose_y_0 = const()[name = tensor("out_37_transpose_y_0"), val = tensor(false)]; tensor v_t_19_cast_fp16 = transpose(perm = v_t_19_perm_0, x = v_37_cast_fp16)[name = tensor("transpose_129")]; tensor out_37_cast_fp16 = matmul(transpose_x = out_37_transpose_x_0, transpose_y = out_37_transpose_y_0, x = attn_75_cast_fp16, y = v_t_19_cast_fp16)[name = tensor("out_37_cast_fp16")]; tensor var_1600_perm_0 = const()[name = tensor("op_1600_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1601 = const()[name = tensor("op_1601"), val = tensor([1, 110, -1])]; tensor var_1600_cast_fp16 = transpose(perm = var_1600_perm_0, x = out_37_cast_fp16)[name = tensor("transpose_126")]; tensor input_187_cast_fp16 = reshape(shape = var_1601, x = var_1600_cast_fp16)[name = tensor("input_187_cast_fp16")]; tensor layers_9_self_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_9_self_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(138306880)))]; tensor linear_46_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_9_self_attn_o_proj_weight_to_fp16, x = input_187_cast_fp16)[name = tensor("linear_46_cast_fp16")]; tensor input_189_cast_fp16 = add(x = input_183_cast_fp16, y = linear_46_cast_fp16)[name = tensor("input_189_cast_fp16")]; tensor x_93_axes_0 = const()[name = tensor("x_93_axes_0"), val = tensor([-1])]; tensor layers_9_norm_xa_query_weight_to_fp16 = const()[name = tensor("layers_9_norm_xa_query_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139486592)))]; tensor x_93_cast_fp16 = layer_norm(axes = x_93_axes_0, epsilon = var_1555_to_fp16, gamma = layers_9_norm_xa_query_weight_to_fp16, x = input_189_cast_fp16)[name = tensor("x_93_cast_fp16")]; tensor memory_19_axes_0 = const()[name = tensor("memory_19_axes_0"), val = tensor([-1])]; tensor layers_9_norm_xa_memory_weight_to_fp16 = const()[name = tensor("layers_9_norm_xa_memory_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139488192)))]; tensor memory_19_cast_fp16 = layer_norm(axes = memory_19_axes_0, epsilon = var_1555_to_fp16, gamma = layers_9_norm_xa_memory_weight_to_fp16, x = encoder_output)[name = tensor("memory_19_cast_fp16")]; tensor layers_9_cross_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_9_cross_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139489792)))]; tensor linear_47_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = layers_9_cross_attn_q_proj_weight_to_fp16, x = x_93_cast_fp16)[name = tensor("linear_47_cast_fp16")]; tensor var_1624 = const()[name = tensor("op_1624"), val = tensor([1, 110, 1, 128])]; tensor var_1625_cast_fp16 = reshape(shape = var_1624, x = linear_47_cast_fp16)[name = tensor("op_1625_cast_fp16")]; tensor layers_9_cross_attn_kv_proj_weight_to_fp16 = const()[name = tensor("layers_9_cross_attn_kv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139686464)))]; tensor linear_48_cast_fp16 = linear(bias = linear_3_bias_0_to_fp16, weight = layers_9_cross_attn_kv_proj_weight_to_fp16, x = memory_19_cast_fp16)[name = tensor("linear_48_cast_fp16")]; tensor var_1629 = const()[name = tensor("op_1629"), val = tensor([1, 256, 2, 1, 128])]; tensor kv_19_cast_fp16 = reshape(shape = var_1629, x = linear_48_cast_fp16)[name = tensor("kv_19_cast_fp16")]; tensor var_1633_begin_0 = const()[name = tensor("op_1633_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_1633_end_0 = const()[name = tensor("op_1633_end_0"), val = tensor([1, 256, 1, 1, 128])]; tensor var_1633_end_mask_0 = const()[name = tensor("op_1633_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_1633_squeeze_mask_0 = const()[name = tensor("op_1633_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_1633_cast_fp16 = slice_by_index(begin = var_1633_begin_0, end = var_1633_end_0, end_mask = var_1633_end_mask_0, squeeze_mask = var_1633_squeeze_mask_0, x = kv_19_cast_fp16)[name = tensor("op_1633_cast_fp16")]; tensor var_1637_begin_0 = const()[name = tensor("op_1637_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor var_1637_end_0 = const()[name = tensor("op_1637_end_0"), val = tensor([1, 256, 2, 1, 128])]; tensor var_1637_end_mask_0 = const()[name = tensor("op_1637_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_1637_squeeze_mask_0 = const()[name = tensor("op_1637_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_1637_cast_fp16 = slice_by_index(begin = var_1637_begin_0, end = var_1637_end_0, end_mask = var_1637_end_mask_0, squeeze_mask = var_1637_squeeze_mask_0, x = kv_19_cast_fp16)[name = tensor("op_1637_cast_fp16")]; tensor v_39_perm_0 = const()[name = tensor("v_39_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1640_transpose_x_0 = const()[name = tensor("op_1640_transpose_x_0"), val = tensor(false)]; tensor var_1640_transpose_y_0 = const()[name = tensor("op_1640_transpose_y_0"), val = tensor(false)]; tensor transpose_104_perm_0 = const()[name = tensor("transpose_104_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_105_perm_0 = const()[name = tensor("transpose_105_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_105 = transpose(perm = transpose_105_perm_0, x = var_1633_cast_fp16)[name = tensor("transpose_123")]; tensor transpose_104 = transpose(perm = transpose_104_perm_0, x = var_1625_cast_fp16)[name = tensor("transpose_124")]; tensor var_1640_cast_fp16 = matmul(transpose_x = var_1640_transpose_x_0, transpose_y = var_1640_transpose_y_0, x = transpose_104, y = transpose_105)[name = tensor("op_1640_cast_fp16")]; tensor var_1641_to_fp16 = const()[name = tensor("op_1641_to_fp16"), val = tensor(0x1.6ap-4)]; tensor attn_77_cast_fp16 = mul(x = var_1640_cast_fp16, y = var_1641_to_fp16)[name = tensor("attn_77_cast_fp16")]; tensor var_1539_to_fp16 = const()[name = tensor("op_1539_to_fp16"), val = tensor(-inf)]; tensor input_191_cast_fp16 = select(a = var_1539_to_fp16, b = attn_77_cast_fp16, cond = var_151)[name = tensor("input_191_cast_fp16")]; tensor attn_79_cast_fp16 = softmax(axis = var_1548, x = input_191_cast_fp16)[name = tensor("attn_79_cast_fp16")]; tensor out_39_transpose_x_0 = const()[name = tensor("out_39_transpose_x_0"), val = tensor(false)]; tensor out_39_transpose_y_0 = const()[name = tensor("out_39_transpose_y_0"), val = tensor(false)]; tensor v_39_cast_fp16 = transpose(perm = v_39_perm_0, x = var_1637_cast_fp16)[name = tensor("transpose_125")]; tensor out_39_cast_fp16 = matmul(transpose_x = out_39_transpose_x_0, transpose_y = out_39_transpose_y_0, x = attn_79_cast_fp16, y = v_39_cast_fp16)[name = tensor("out_39_cast_fp16")]; tensor var_1649_perm_0 = const()[name = tensor("op_1649_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1650 = const()[name = tensor("op_1650"), val = tensor([1, 110, -1])]; tensor var_1649_cast_fp16 = transpose(perm = var_1649_perm_0, x = out_39_cast_fp16)[name = tensor("transpose_122")]; tensor input_193_cast_fp16 = reshape(shape = var_1650, x = var_1649_cast_fp16)[name = tensor("input_193_cast_fp16")]; tensor layers_9_cross_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_9_cross_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(140079744)))]; tensor linear_49_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_9_cross_attn_o_proj_weight_to_fp16, x = input_193_cast_fp16)[name = tensor("linear_49_cast_fp16")]; tensor input_195_cast_fp16 = add(x = input_189_cast_fp16, y = linear_49_cast_fp16)[name = tensor("input_195_cast_fp16")]; tensor x_95_axes_0 = const()[name = tensor("x_95_axes_0"), val = tensor([-1])]; tensor layers_9_norm_ff_weight_to_fp16 = const()[name = tensor("layers_9_norm_ff_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(140276416)))]; tensor x_95_cast_fp16 = layer_norm(axes = x_95_axes_0, epsilon = var_1555_to_fp16, gamma = layers_9_norm_ff_weight_to_fp16, x = input_195_cast_fp16)[name = tensor("x_95_cast_fp16")]; tensor input_197_perm_0 = const()[name = tensor("input_197_perm_0"), val = tensor([0, 2, 1])]; tensor input_199_pad_type_0 = const()[name = tensor("input_199_pad_type_0"), val = tensor("valid")]; tensor input_199_strides_0 = const()[name = tensor("input_199_strides_0"), val = tensor([1])]; tensor input_199_pad_0 = const()[name = tensor("input_199_pad_0"), val = tensor([0, 0])]; tensor input_199_dilations_0 = const()[name = tensor("input_199_dilations_0"), val = tensor([1])]; tensor input_199_groups_0 = const()[name = tensor("input_199_groups_0"), val = tensor(1)]; tensor layers_9_ffn_conv1_weight_to_fp16 = const()[name = tensor("layers_9_ffn_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(140278016)))]; tensor input_197_cast_fp16 = transpose(perm = input_197_perm_0, x = x_95_cast_fp16)[name = tensor("transpose_121")]; tensor input_199_cast_fp16 = conv(dilations = input_199_dilations_0, groups = input_199_groups_0, pad = input_199_pad_0, pad_type = input_199_pad_type_0, strides = input_199_strides_0, weight = layers_9_ffn_conv1_weight_to_fp16, x = input_197_cast_fp16)[name = tensor("input_199_cast_fp16")]; tensor input_201_mode_0 = const()[name = tensor("input_201_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor input_201_cast_fp16 = gelu(mode = input_201_mode_0, x = input_199_cast_fp16)[name = tensor("input_201_cast_fp16")]; tensor x_97_pad_type_0 = const()[name = tensor("x_97_pad_type_0"), val = tensor("valid")]; tensor x_97_strides_0 = const()[name = tensor("x_97_strides_0"), val = tensor([1])]; tensor x_97_pad_0 = const()[name = tensor("x_97_pad_0"), val = tensor([0, 0])]; tensor x_97_dilations_0 = const()[name = tensor("x_97_dilations_0"), val = tensor([1])]; tensor x_97_groups_0 = const()[name = tensor("x_97_groups_0"), val = tensor(1)]; tensor layers_9_ffn_conv2_weight_to_fp16 = const()[name = tensor("layers_9_ffn_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144996672)))]; tensor x_97_cast_fp16 = conv(dilations = x_97_dilations_0, groups = x_97_groups_0, pad = x_97_pad_0, pad_type = x_97_pad_type_0, strides = x_97_strides_0, weight = layers_9_ffn_conv2_weight_to_fp16, x = input_201_cast_fp16)[name = tensor("x_97_cast_fp16")]; tensor x_99_perm_0 = const()[name = tensor("x_99_perm_0"), val = tensor([0, 2, 1])]; tensor x_99_cast_fp16 = transpose(perm = x_99_perm_0, x = x_97_cast_fp16)[name = tensor("transpose_120")]; tensor input_203_cast_fp16 = add(x = input_195_cast_fp16, y = x_99_cast_fp16)[name = tensor("input_203_cast_fp16")]; tensor k_padded_19_pad_0 = const()[name = tensor("k_padded_19_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor k_padded_19_mode_0 = const()[name = tensor("k_padded_19_mode_0"), val = tensor("constant")]; tensor const_70_to_fp16 = const()[name = tensor("const_70_to_fp16"), val = tensor(0x0p+0)]; tensor k_padded_19_cast_fp16 = pad(constant_val = const_70_to_fp16, mode = k_padded_19_mode_0, pad = k_padded_19_pad_0, x = k_37_cast_fp16)[name = tensor("k_padded_19_cast_fp16")]; tensor v_padded_19_pad_0 = const()[name = tensor("v_padded_19_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor v_padded_19_mode_0 = const()[name = tensor("v_padded_19_mode_0"), val = tensor("constant")]; tensor const_71_to_fp16 = const()[name = tensor("const_71_to_fp16"), val = tensor(0x0p+0)]; tensor v_padded_19_cast_fp16 = pad(constant_val = const_71_to_fp16, mode = v_padded_19_mode_0, pad = v_padded_19_pad_0, x = v_37_cast_fp16)[name = tensor("v_padded_19_cast_fp16")]; tensor var_1702_axis_0 = const()[name = tensor("op_1702_axis_0"), val = tensor(0)]; tensor var_1702 = stack(axis = var_1702_axis_0, values = (k_padded_19_cast_fp16, v_padded_19_cast_fp16))[name = tensor("op_1702_cast_fp16")]; tensor var_1714 = const()[name = tensor("op_1714"), val = tensor(-1)]; tensor x_101_axes_0 = const()[name = tensor("x_101_axes_0"), val = tensor([-1])]; tensor layers_10_norm_sa_weight_to_fp16 = const()[name = tensor("layers_10_norm_sa_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(149715328)))]; tensor var_1721_to_fp16 = const()[name = tensor("op_1721_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_101_cast_fp16 = layer_norm(axes = x_101_axes_0, epsilon = var_1721_to_fp16, gamma = layers_10_norm_sa_weight_to_fp16, x = input_203_cast_fp16)[name = tensor("x_101_cast_fp16")]; tensor layers_10_self_attn_qkv_proj_weight_to_fp16 = const()[name = tensor("layers_10_self_attn_qkv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(149716928)))]; tensor linear_50_cast_fp16 = linear(bias = linear_0_bias_0_to_fp16, weight = layers_10_self_attn_qkv_proj_weight_to_fp16, x = x_101_cast_fp16)[name = tensor("linear_50_cast_fp16")]; tensor var_1739 = const()[name = tensor("op_1739"), val = tensor([1, 110, 3, 12, 64])]; tensor qkv_21_cast_fp16 = reshape(shape = var_1739, x = linear_50_cast_fp16)[name = tensor("qkv_21_cast_fp16")]; tensor q_61_begin_0 = const()[name = tensor("q_61_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_61_end_0 = const()[name = tensor("q_61_end_0"), val = tensor([1, 110, 1, 12, 64])]; tensor q_61_end_mask_0 = const()[name = tensor("q_61_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_61_squeeze_mask_0 = const()[name = tensor("q_61_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_61_cast_fp16 = slice_by_index(begin = q_61_begin_0, end = q_61_end_0, end_mask = q_61_end_mask_0, squeeze_mask = q_61_squeeze_mask_0, x = qkv_21_cast_fp16)[name = tensor("q_61_cast_fp16")]; tensor k_41_begin_0 = const()[name = tensor("k_41_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_41_end_0 = const()[name = tensor("k_41_end_0"), val = tensor([1, 110, 2, 12, 64])]; tensor k_41_end_mask_0 = const()[name = tensor("k_41_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_41_squeeze_mask_0 = const()[name = tensor("k_41_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_41_cast_fp16 = slice_by_index(begin = k_41_begin_0, end = k_41_end_0, end_mask = k_41_end_mask_0, squeeze_mask = k_41_squeeze_mask_0, x = qkv_21_cast_fp16)[name = tensor("k_41_cast_fp16")]; tensor v_41_begin_0 = const()[name = tensor("v_41_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_41_end_0 = const()[name = tensor("v_41_end_0"), val = tensor([1, 110, 3, 12, 64])]; tensor v_41_end_mask_0 = const()[name = tensor("v_41_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_41_squeeze_mask_0 = const()[name = tensor("v_41_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_41_cast_fp16 = slice_by_index(begin = v_41_begin_0, end = v_41_end_0, end_mask = v_41_end_mask_0, squeeze_mask = v_41_squeeze_mask_0, x = qkv_21_cast_fp16)[name = tensor("v_41_cast_fp16")]; tensor v_t_21_perm_0 = const()[name = tensor("v_t_21_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1754_transpose_x_0 = const()[name = tensor("op_1754_transpose_x_0"), val = tensor(false)]; tensor var_1754_transpose_y_0 = const()[name = tensor("op_1754_transpose_y_0"), val = tensor(false)]; tensor transpose_106_perm_0 = const()[name = tensor("transpose_106_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_107_perm_0 = const()[name = tensor("transpose_107_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_107 = transpose(perm = transpose_107_perm_0, x = k_41_cast_fp16)[name = tensor("transpose_117")]; tensor transpose_106 = transpose(perm = transpose_106_perm_0, x = q_61_cast_fp16)[name = tensor("transpose_118")]; tensor var_1754_cast_fp16 = matmul(transpose_x = var_1754_transpose_x_0, transpose_y = var_1754_transpose_y_0, x = transpose_106, y = transpose_107)[name = tensor("op_1754_cast_fp16")]; tensor var_1755_to_fp16 = const()[name = tensor("op_1755_to_fp16"), val = tensor(0x1p-3)]; tensor attn_81_cast_fp16 = mul(x = var_1754_cast_fp16, y = var_1755_to_fp16)[name = tensor("attn_81_cast_fp16")]; tensor attn_81_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("attn_81_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor attn_81_cast_fp16_to_fp32 = cast(dtype = attn_81_cast_fp16_to_fp32_dtype_0, x = attn_81_cast_fp16)[name = tensor("cast_73")]; tensor input_205 = add(x = attn_81_cast_fp16_to_fp32, y = var_102)[name = tensor("input_205")]; tensor input_205_to_fp16_dtype_0 = const()[name = tensor("input_205_to_fp16_dtype_0"), val = tensor("fp16")]; tensor input_205_to_fp16 = cast(dtype = input_205_to_fp16_dtype_0, x = input_205)[name = tensor("cast_72")]; tensor attn_83_cast_fp16 = softmax(axis = var_1714, x = input_205_to_fp16)[name = tensor("attn_83_cast_fp16")]; tensor out_41_transpose_x_0 = const()[name = tensor("out_41_transpose_x_0"), val = tensor(false)]; tensor out_41_transpose_y_0 = const()[name = tensor("out_41_transpose_y_0"), val = tensor(false)]; tensor v_t_21_cast_fp16 = transpose(perm = v_t_21_perm_0, x = v_41_cast_fp16)[name = tensor("transpose_119")]; tensor out_41_cast_fp16 = matmul(transpose_x = out_41_transpose_x_0, transpose_y = out_41_transpose_y_0, x = attn_83_cast_fp16, y = v_t_21_cast_fp16)[name = tensor("out_41_cast_fp16")]; tensor var_1766_perm_0 = const()[name = tensor("op_1766_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1767 = const()[name = tensor("op_1767"), val = tensor([1, 110, -1])]; tensor var_1766_cast_fp16 = transpose(perm = var_1766_perm_0, x = out_41_cast_fp16)[name = tensor("transpose_116")]; tensor input_207_cast_fp16 = reshape(shape = var_1767, x = var_1766_cast_fp16)[name = tensor("input_207_cast_fp16")]; tensor layers_10_self_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_10_self_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(153255936)))]; tensor linear_51_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_10_self_attn_o_proj_weight_to_fp16, x = input_207_cast_fp16)[name = tensor("linear_51_cast_fp16")]; tensor input_209_cast_fp16 = add(x = input_203_cast_fp16, y = linear_51_cast_fp16)[name = tensor("input_209_cast_fp16")]; tensor x_103_axes_0 = const()[name = tensor("x_103_axes_0"), val = tensor([-1])]; tensor layers_10_norm_xa_query_weight_to_fp16 = const()[name = tensor("layers_10_norm_xa_query_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(154435648)))]; tensor x_103_cast_fp16 = layer_norm(axes = x_103_axes_0, epsilon = var_1721_to_fp16, gamma = layers_10_norm_xa_query_weight_to_fp16, x = input_209_cast_fp16)[name = tensor("x_103_cast_fp16")]; tensor memory_21_axes_0 = const()[name = tensor("memory_21_axes_0"), val = tensor([-1])]; tensor layers_10_norm_xa_memory_weight_to_fp16 = const()[name = tensor("layers_10_norm_xa_memory_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(154437248)))]; tensor memory_21_cast_fp16 = layer_norm(axes = memory_21_axes_0, epsilon = var_1721_to_fp16, gamma = layers_10_norm_xa_memory_weight_to_fp16, x = encoder_output)[name = tensor("memory_21_cast_fp16")]; tensor layers_10_cross_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_10_cross_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(154438848)))]; tensor linear_52_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = layers_10_cross_attn_q_proj_weight_to_fp16, x = x_103_cast_fp16)[name = tensor("linear_52_cast_fp16")]; tensor var_1790 = const()[name = tensor("op_1790"), val = tensor([1, 110, 1, 128])]; tensor var_1791_cast_fp16 = reshape(shape = var_1790, x = linear_52_cast_fp16)[name = tensor("op_1791_cast_fp16")]; tensor layers_10_cross_attn_kv_proj_weight_to_fp16 = const()[name = tensor("layers_10_cross_attn_kv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(154635520)))]; tensor linear_53_cast_fp16 = linear(bias = linear_3_bias_0_to_fp16, weight = layers_10_cross_attn_kv_proj_weight_to_fp16, x = memory_21_cast_fp16)[name = tensor("linear_53_cast_fp16")]; tensor var_1795 = const()[name = tensor("op_1795"), val = tensor([1, 256, 2, 1, 128])]; tensor kv_21_cast_fp16 = reshape(shape = var_1795, x = linear_53_cast_fp16)[name = tensor("kv_21_cast_fp16")]; tensor var_1799_begin_0 = const()[name = tensor("op_1799_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_1799_end_0 = const()[name = tensor("op_1799_end_0"), val = tensor([1, 256, 1, 1, 128])]; tensor var_1799_end_mask_0 = const()[name = tensor("op_1799_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_1799_squeeze_mask_0 = const()[name = tensor("op_1799_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_1799_cast_fp16 = slice_by_index(begin = var_1799_begin_0, end = var_1799_end_0, end_mask = var_1799_end_mask_0, squeeze_mask = var_1799_squeeze_mask_0, x = kv_21_cast_fp16)[name = tensor("op_1799_cast_fp16")]; tensor var_1803_begin_0 = const()[name = tensor("op_1803_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor var_1803_end_0 = const()[name = tensor("op_1803_end_0"), val = tensor([1, 256, 2, 1, 128])]; tensor var_1803_end_mask_0 = const()[name = tensor("op_1803_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor var_1803_squeeze_mask_0 = const()[name = tensor("op_1803_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor var_1803_cast_fp16 = slice_by_index(begin = var_1803_begin_0, end = var_1803_end_0, end_mask = var_1803_end_mask_0, squeeze_mask = var_1803_squeeze_mask_0, x = kv_21_cast_fp16)[name = tensor("op_1803_cast_fp16")]; tensor v_43_perm_0 = const()[name = tensor("v_43_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1806_transpose_x_0 = const()[name = tensor("op_1806_transpose_x_0"), val = tensor(false)]; tensor var_1806_transpose_y_0 = const()[name = tensor("op_1806_transpose_y_0"), val = tensor(false)]; tensor transpose_108_perm_0 = const()[name = tensor("transpose_108_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_109_perm_0 = const()[name = tensor("transpose_109_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_109 = transpose(perm = transpose_109_perm_0, x = var_1799_cast_fp16)[name = tensor("transpose_113")]; tensor transpose_108 = transpose(perm = transpose_108_perm_0, x = var_1791_cast_fp16)[name = tensor("transpose_114")]; tensor var_1806_cast_fp16 = matmul(transpose_x = var_1806_transpose_x_0, transpose_y = var_1806_transpose_y_0, x = transpose_108, y = transpose_109)[name = tensor("op_1806_cast_fp16")]; tensor var_1807_to_fp16 = const()[name = tensor("op_1807_to_fp16"), val = tensor(0x1.6ap-4)]; tensor attn_85_cast_fp16 = mul(x = var_1806_cast_fp16, y = var_1807_to_fp16)[name = tensor("attn_85_cast_fp16")]; tensor var_1705_to_fp16 = const()[name = tensor("op_1705_to_fp16"), val = tensor(-inf)]; tensor input_211_cast_fp16 = select(a = var_1705_to_fp16, b = attn_85_cast_fp16, cond = var_151)[name = tensor("input_211_cast_fp16")]; tensor attn_87_cast_fp16 = softmax(axis = var_1714, x = input_211_cast_fp16)[name = tensor("attn_87_cast_fp16")]; tensor out_43_transpose_x_0 = const()[name = tensor("out_43_transpose_x_0"), val = tensor(false)]; tensor out_43_transpose_y_0 = const()[name = tensor("out_43_transpose_y_0"), val = tensor(false)]; tensor v_43_cast_fp16 = transpose(perm = v_43_perm_0, x = var_1803_cast_fp16)[name = tensor("transpose_115")]; tensor out_43_cast_fp16 = matmul(transpose_x = out_43_transpose_x_0, transpose_y = out_43_transpose_y_0, x = attn_87_cast_fp16, y = v_43_cast_fp16)[name = tensor("out_43_cast_fp16")]; tensor var_1815_perm_0 = const()[name = tensor("op_1815_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1816 = const()[name = tensor("op_1816"), val = tensor([1, 110, -1])]; tensor var_1815_cast_fp16 = transpose(perm = var_1815_perm_0, x = out_43_cast_fp16)[name = tensor("transpose_112")]; tensor input_213_cast_fp16 = reshape(shape = var_1816, x = var_1815_cast_fp16)[name = tensor("input_213_cast_fp16")]; tensor layers_10_cross_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_10_cross_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(155028800)))]; tensor linear_54_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = layers_10_cross_attn_o_proj_weight_to_fp16, x = input_213_cast_fp16)[name = tensor("linear_54_cast_fp16")]; tensor input_215_cast_fp16 = add(x = input_209_cast_fp16, y = linear_54_cast_fp16)[name = tensor("input_215_cast_fp16")]; tensor x_105_axes_0 = const()[name = tensor("x_105_axes_0"), val = tensor([-1])]; tensor layers_10_norm_ff_weight_to_fp16 = const()[name = tensor("layers_10_norm_ff_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(155225472)))]; tensor x_105_cast_fp16 = layer_norm(axes = x_105_axes_0, epsilon = var_1721_to_fp16, gamma = layers_10_norm_ff_weight_to_fp16, x = input_215_cast_fp16)[name = tensor("x_105_cast_fp16")]; tensor input_217_perm_0 = const()[name = tensor("input_217_perm_0"), val = tensor([0, 2, 1])]; tensor input_219_pad_type_0 = const()[name = tensor("input_219_pad_type_0"), val = tensor("valid")]; tensor input_219_strides_0 = const()[name = tensor("input_219_strides_0"), val = tensor([1])]; tensor input_219_pad_0 = const()[name = tensor("input_219_pad_0"), val = tensor([0, 0])]; tensor input_219_dilations_0 = const()[name = tensor("input_219_dilations_0"), val = tensor([1])]; tensor input_219_groups_0 = const()[name = tensor("input_219_groups_0"), val = tensor(1)]; tensor layers_10_ffn_conv1_weight_to_fp16 = const()[name = tensor("layers_10_ffn_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(155227072)))]; tensor input_217_cast_fp16 = transpose(perm = input_217_perm_0, x = x_105_cast_fp16)[name = tensor("transpose_111")]; tensor input_219_cast_fp16 = conv(dilations = input_219_dilations_0, groups = input_219_groups_0, pad = input_219_pad_0, pad_type = input_219_pad_type_0, strides = input_219_strides_0, weight = layers_10_ffn_conv1_weight_to_fp16, x = input_217_cast_fp16)[name = tensor("input_219_cast_fp16")]; tensor input_221_mode_0 = const()[name = tensor("input_221_mode_0"), val = tensor("TANH_APPROXIMATION")]; tensor input_221_cast_fp16 = gelu(mode = input_221_mode_0, x = input_219_cast_fp16)[name = tensor("input_221_cast_fp16")]; tensor x_107_pad_type_0 = const()[name = tensor("x_107_pad_type_0"), val = tensor("valid")]; tensor x_107_strides_0 = const()[name = tensor("x_107_strides_0"), val = tensor([1])]; tensor x_107_pad_0 = const()[name = tensor("x_107_pad_0"), val = tensor([0, 0])]; tensor x_107_dilations_0 = const()[name = tensor("x_107_dilations_0"), val = tensor([1])]; tensor x_107_groups_0 = const()[name = tensor("x_107_groups_0"), val = tensor(1)]; tensor layers_10_ffn_conv2_weight_to_fp16 = const()[name = tensor("layers_10_ffn_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159945728)))]; tensor x_107_cast_fp16 = conv(dilations = x_107_dilations_0, groups = x_107_groups_0, pad = x_107_pad_0, pad_type = x_107_pad_type_0, strides = x_107_strides_0, weight = layers_10_ffn_conv2_weight_to_fp16, x = input_221_cast_fp16)[name = tensor("x_107_cast_fp16")]; tensor x_109_perm_0 = const()[name = tensor("x_109_perm_0"), val = tensor([0, 2, 1])]; tensor x_109_cast_fp16 = transpose(perm = x_109_perm_0, x = x_107_cast_fp16)[name = tensor("transpose_110")]; tensor input_223_cast_fp16 = add(x = input_215_cast_fp16, y = x_109_cast_fp16)[name = tensor("input_223_cast_fp16")]; tensor k_padded_21_pad_0 = const()[name = tensor("k_padded_21_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor k_padded_21_mode_0 = const()[name = tensor("k_padded_21_mode_0"), val = tensor("constant")]; tensor const_77_to_fp16 = const()[name = tensor("const_77_to_fp16"), val = tensor(0x0p+0)]; tensor k_padded_21_cast_fp16 = pad(constant_val = const_77_to_fp16, mode = k_padded_21_mode_0, pad = k_padded_21_pad_0, x = k_41_cast_fp16)[name = tensor("k_padded_21_cast_fp16")]; tensor v_padded_21_pad_0 = const()[name = tensor("v_padded_21_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor v_padded_21_mode_0 = const()[name = tensor("v_padded_21_mode_0"), val = tensor("constant")]; tensor const_78_to_fp16 = const()[name = tensor("const_78_to_fp16"), val = tensor(0x0p+0)]; tensor v_padded_21_cast_fp16 = pad(constant_val = const_78_to_fp16, mode = v_padded_21_mode_0, pad = v_padded_21_pad_0, x = v_41_cast_fp16)[name = tensor("v_padded_21_cast_fp16")]; tensor var_1868_axis_0 = const()[name = tensor("op_1868_axis_0"), val = tensor(0)]; tensor var_1868 = stack(axis = var_1868_axis_0, values = (k_padded_21_cast_fp16, v_padded_21_cast_fp16))[name = tensor("op_1868_cast_fp16")]; tensor x_111_axes_0 = const()[name = tensor("x_111_axes_0"), val = tensor([-1])]; tensor layers_11_norm_sa_weight_to_fp16 = const()[name = tensor("layers_11_norm_sa_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164664384)))]; tensor var_1884_to_fp16 = const()[name = tensor("op_1884_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_111_cast_fp16 = layer_norm(axes = x_111_axes_0, epsilon = var_1884_to_fp16, gamma = layers_11_norm_sa_weight_to_fp16, x = input_223_cast_fp16)[name = tensor("x_111_cast_fp16")]; tensor layers_11_self_attn_qkv_proj_weight_to_fp16 = const()[name = tensor("layers_11_self_attn_qkv_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164665984)))]; tensor linear_55_cast_fp16 = linear(bias = linear_0_bias_0_to_fp16, weight = layers_11_self_attn_qkv_proj_weight_to_fp16, x = x_111_cast_fp16)[name = tensor("linear_55_cast_fp16")]; tensor var_1897 = const()[name = tensor("op_1897"), val = tensor([1, 110, 3, 12, 64])]; tensor qkv_cast_fp16 = reshape(shape = var_1897, x = linear_55_cast_fp16)[name = tensor("qkv_cast_fp16")]; tensor k_45_begin_0 = const()[name = tensor("k_45_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_45_end_0 = const()[name = tensor("k_45_end_0"), val = tensor([1, 110, 2, 12, 64])]; tensor k_45_end_mask_0 = const()[name = tensor("k_45_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_45_squeeze_mask_0 = const()[name = tensor("k_45_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_45_cast_fp16 = slice_by_index(begin = k_45_begin_0, end = k_45_end_0, end_mask = k_45_end_mask_0, squeeze_mask = k_45_squeeze_mask_0, x = qkv_cast_fp16)[name = tensor("k_45_cast_fp16")]; tensor v_45_begin_0 = const()[name = tensor("v_45_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_45_end_0 = const()[name = tensor("v_45_end_0"), val = tensor([1, 110, 3, 12, 64])]; tensor v_45_end_mask_0 = const()[name = tensor("v_45_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_45_squeeze_mask_0 = const()[name = tensor("v_45_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_45_cast_fp16 = slice_by_index(begin = v_45_begin_0, end = v_45_end_0, end_mask = v_45_end_mask_0, squeeze_mask = v_45_squeeze_mask_0, x = qkv_cast_fp16)[name = tensor("v_45_cast_fp16")]; tensor k_padded_pad_0 = const()[name = tensor("k_padded_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor k_padded_mode_0 = const()[name = tensor("k_padded_mode_0"), val = tensor("constant")]; tensor const_81_to_fp16 = const()[name = tensor("const_81_to_fp16"), val = tensor(0x0p+0)]; tensor k_padded_cast_fp16 = pad(constant_val = const_81_to_fp16, mode = k_padded_mode_0, pad = k_padded_pad_0, x = k_45_cast_fp16)[name = tensor("k_padded_cast_fp16")]; tensor v_padded_pad_0 = const()[name = tensor("v_padded_pad_0"), val = tensor([0, 0, 0, 402, 0, 0, 0, 0])]; tensor v_padded_mode_0 = const()[name = tensor("v_padded_mode_0"), val = tensor("constant")]; tensor const_82_to_fp16 = const()[name = tensor("const_82_to_fp16"), val = tensor(0x0p+0)]; tensor v_padded_cast_fp16 = pad(constant_val = const_82_to_fp16, mode = v_padded_mode_0, pad = v_padded_pad_0, x = v_45_cast_fp16)[name = tensor("v_padded_cast_fp16")]; tensor var_1958_axis_0 = const()[name = tensor("op_1958_axis_0"), val = tensor(0)]; tensor var_1958 = stack(axis = var_1958_axis_0, values = (k_padded_cast_fp16, v_padded_cast_fp16))[name = tensor("op_1958_cast_fp16")]; } -> (var_208, var_374, var_540, var_706, var_872, var_1038, var_1204, var_1370, var_1536, var_1702, var_1868, var_1958); }