program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3520.4.1"}, {"coremlc-version", "3520.5.1"}, {"coremltools-component-torch", "2.9.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "9.0"}})] { func main(tensor attention_mask, tensor input_ids) { tensor var_16 = const()[name = tensor("op_16"), val = tensor(0)]; tensor var_18 = const()[name = tensor("op_18"), val = tensor(-1)]; tensor var_19 = const()[name = tensor("op_19"), val = tensor(1)]; tensor var_55_batch_dims_0 = const()[name = tensor("op_55_batch_dims_0"), val = tensor(0)]; tensor var_55_validate_indices_0 = const()[name = tensor("op_55_validate_indices_0"), val = tensor(false)]; tensor encoder_embed_tokens_weight_to_fp16 = const()[name = tensor("encoder_embed_tokens_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor greater_equal_0_y_0 = const()[name = tensor("greater_equal_0_y_0"), val = tensor(0)]; tensor greater_equal_0 = greater_equal(x = input_ids, y = greater_equal_0_y_0)[name = tensor("greater_equal_0")]; tensor slice_by_index_0 = const()[name = tensor("slice_by_index_0"), val = tensor(256206)]; tensor add_0 = add(x = input_ids, y = slice_by_index_0)[name = tensor("add_0")]; tensor select_0 = select(a = input_ids, b = add_0, cond = greater_equal_0)[name = tensor("select_0")]; tensor var_55_cast_fp16_axis_0 = const()[name = tensor("op_55_cast_fp16_axis_0"), val = tensor(0)]; tensor var_55_cast_fp16 = gather(axis = var_55_cast_fp16_axis_0, batch_dims = var_55_batch_dims_0, indices = select_0, validate_indices = var_55_validate_indices_0, x = encoder_embed_tokens_weight_to_fp16)[name = tensor("op_55_cast_fp16")]; tensor var_56_to_fp16 = const()[name = tensor("op_56_to_fp16"), val = tensor(0x1p+5)]; tensor inputs_embeds_1_cast_fp16 = mul(x = var_55_cast_fp16, y = var_56_to_fp16)[name = tensor("inputs_embeds_1_cast_fp16")]; tensor var_61 = not_equal(x = input_ids, y = var_19)[name = tensor("op_61")]; tensor mask_1_dtype_0 = const()[name = tensor("mask_1_dtype_0"), val = tensor("int32")]; tensor var_63_exclusive_0 = const()[name = tensor("op_63_exclusive_0"), val = tensor(false)]; tensor var_63_reverse_0 = const()[name = tensor("op_63_reverse_0"), val = tensor(false)]; tensor mask_1 = cast(dtype = mask_1_dtype_0, x = var_61)[name = tensor("cast_56")]; tensor var_63 = cumsum(axis = var_19, exclusive = var_63_exclusive_0, reverse = var_63_reverse_0, x = mask_1)[name = tensor("op_63")]; tensor incremental_indices_1 = mul(x = var_63, y = mask_1)[name = tensor("incremental_indices_1")]; tensor var_69 = const()[name = tensor("op_69"), val = tensor(1)]; tensor var_70 = add(x = incremental_indices_1, y = var_69)[name = tensor("op_70")]; tensor var_72 = const()[name = tensor("op_72"), val = tensor([-1])]; tensor var_73 = reshape(shape = var_72, x = var_70)[name = tensor("op_73")]; tensor var_74_batch_dims_0 = const()[name = tensor("op_74_batch_dims_0"), val = tensor(0)]; tensor var_74_validate_indices_0 = const()[name = tensor("op_74_validate_indices_0"), val = tensor(false)]; tensor encoder_embed_positions_weights_to_fp16 = const()[name = tensor("encoder_embed_positions_weights_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(524710016)))]; tensor var_73_to_uint16_dtype_0 = const()[name = tensor("op_73_to_uint16_dtype_0"), val = tensor("uint16")]; tensor var_73_to_uint16 = cast(dtype = var_73_to_uint16_dtype_0, x = var_73)[name = tensor("cast_55")]; tensor var_74_cast_fp16_cast_uint16 = gather(axis = var_16, batch_dims = var_74_batch_dims_0, indices = var_73_to_uint16, validate_indices = var_74_validate_indices_0, x = encoder_embed_positions_weights_to_fp16)[name = tensor("op_74_cast_fp16_cast_uint16")]; tensor var_76 = const()[name = tensor("op_76"), val = tensor([1, 256, 1024])]; tensor var_77_cast_fp16 = reshape(shape = var_76, x = var_74_cast_fp16_cast_uint16)[name = tensor("op_77_cast_fp16")]; tensor input0_7_cast_fp16 = add(x = inputs_embeds_1_cast_fp16, y = var_77_cast_fp16)[name = tensor("input0_7_cast_fp16")]; tensor var_85_axes_0 = const()[name = tensor("op_85_axes_0"), val = tensor([1])]; tensor var_85 = expand_dims(axes = var_85_axes_0, x = attention_mask)[name = tensor("op_85")]; tensor var_86_axes_0 = const()[name = tensor("op_86_axes_0"), val = tensor([2])]; tensor var_86 = expand_dims(axes = var_86_axes_0, x = var_85)[name = tensor("op_86")]; tensor var_89_reps_0 = const()[name = tensor("op_89_reps_0"), val = tensor([1, 1, 256, 1])]; tensor var_89 = tile(reps = var_89_reps_0, x = var_86)[name = tensor("op_89")]; tensor const_6_to_fp16 = const()[name = tensor("const_6_to_fp16"), val = tensor(0x1p+0)]; tensor expanded_mask_1_to_fp16_dtype_0 = const()[name = tensor("expanded_mask_1_to_fp16_dtype_0"), val = tensor("fp16")]; tensor var_89_to_fp16 = cast(dtype = expanded_mask_1_to_fp16_dtype_0, x = var_89)[name = tensor("cast_54")]; tensor inverted_mask_1_cast_fp16 = sub(x = const_6_to_fp16, y = var_89_to_fp16)[name = tensor("inverted_mask_1_cast_fp16")]; tensor var_94_dtype_0 = const()[name = tensor("op_94_dtype_0"), val = tensor("bool")]; tensor var_10_to_fp16 = const()[name = tensor("op_10_to_fp16"), val = tensor(-inf)]; tensor inverted_mask_1_cast_fp16_to_bool = cast(dtype = var_94_dtype_0, x = inverted_mask_1_cast_fp16)[name = tensor("cast_53")]; tensor attention_mask0_1_cast_fp16 = select(a = var_10_to_fp16, b = inverted_mask_1_cast_fp16, cond = inverted_mask_1_cast_fp16_to_bool)[name = tensor("attention_mask0_1_cast_fp16")]; tensor hidden_states_3_axes_0 = const()[name = tensor("hidden_states_3_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526811328)))]; tensor encoder_layers_0_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526813440)))]; tensor var_6_to_fp16 = const()[name = tensor("op_6_to_fp16"), val = tensor(0x1.5p-17)]; tensor hidden_states_3_cast_fp16 = layer_norm(axes = hidden_states_3_axes_0, beta = encoder_layers_0_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_0_self_attn_layer_norm_weight_to_fp16, x = input0_7_cast_fp16)[name = tensor("hidden_states_3_cast_fp16")]; tensor encoder_layers_0_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526815552)))]; tensor encoder_layers_0_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(528912768)))]; tensor linear_0_cast_fp16 = linear(bias = encoder_layers_0_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_0_self_attn_q_proj_weight_to_fp16, x = hidden_states_3_cast_fp16)[name = tensor("linear_0_cast_fp16")]; tensor var_114 = const()[name = tensor("op_114"), val = tensor([1, 256, -1, 64])]; tensor var_115_cast_fp16 = reshape(shape = var_114, x = linear_0_cast_fp16)[name = tensor("op_115_cast_fp16")]; tensor encoder_layers_0_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(528914880)))]; tensor encoder_layers_0_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(531012096)))]; tensor linear_1_cast_fp16 = linear(bias = encoder_layers_0_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_0_self_attn_k_proj_weight_to_fp16, x = hidden_states_3_cast_fp16)[name = tensor("linear_1_cast_fp16")]; tensor encoder_layers_0_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(531014208)))]; tensor encoder_layers_0_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(533111424)))]; tensor linear_2_cast_fp16 = linear(bias = encoder_layers_0_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_0_self_attn_v_proj_weight_to_fp16, x = hidden_states_3_cast_fp16)[name = tensor("linear_2_cast_fp16")]; tensor var_123 = const()[name = tensor("op_123"), val = tensor([1, 256, -1, 64])]; tensor var_124_cast_fp16 = reshape(shape = var_123, x = linear_1_cast_fp16)[name = tensor("op_124_cast_fp16")]; tensor var_126 = const()[name = tensor("op_126"), val = tensor([1, 256, -1, 64])]; tensor var_127_cast_fp16 = reshape(shape = var_126, x = linear_2_cast_fp16)[name = tensor("op_127_cast_fp16")]; tensor value_2_perm_0 = const()[name = tensor("value_2_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_130_transpose_x_0 = const()[name = tensor("op_130_transpose_x_0"), val = tensor(false)]; tensor var_130_transpose_y_0 = const()[name = tensor("op_130_transpose_y_0"), val = tensor(false)]; tensor transpose_36_perm_0 = const()[name = tensor("transpose_36_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_37_perm_0 = const()[name = tensor("transpose_37_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_37 = transpose(perm = transpose_37_perm_0, x = var_124_cast_fp16)[name = tensor("transpose_105")]; tensor transpose_36 = transpose(perm = transpose_36_perm_0, x = var_115_cast_fp16)[name = tensor("transpose_106")]; tensor var_130_cast_fp16 = matmul(transpose_x = var_130_transpose_x_0, transpose_y = var_130_transpose_y_0, x = transpose_36, y = transpose_37)[name = tensor("op_130_cast_fp16")]; tensor var_131_to_fp16 = const()[name = tensor("op_131_to_fp16"), val = tensor(0x1p-3)]; tensor attn_weights_2_cast_fp16 = mul(x = var_130_cast_fp16, y = var_131_to_fp16)[name = tensor("attn_weights_2_cast_fp16")]; tensor input_5_cast_fp16 = add(x = attn_weights_2_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor("input_5_cast_fp16")]; tensor input4_1_cast_fp16 = softmax(axis = var_18, x = input_5_cast_fp16)[name = tensor("input4_1_cast_fp16")]; tensor attn_output_2_transpose_x_0 = const()[name = tensor("attn_output_2_transpose_x_0"), val = tensor(false)]; tensor attn_output_2_transpose_y_0 = const()[name = tensor("attn_output_2_transpose_y_0"), val = tensor(false)]; tensor value_2_cast_fp16 = transpose(perm = value_2_perm_0, x = var_127_cast_fp16)[name = tensor("transpose_107")]; tensor attn_output_2_cast_fp16 = matmul(transpose_x = attn_output_2_transpose_x_0, transpose_y = attn_output_2_transpose_y_0, x = input4_1_cast_fp16, y = value_2_cast_fp16)[name = tensor("attn_output_2_cast_fp16")]; tensor var_137_perm_0 = const()[name = tensor("op_137_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_139 = const()[name = tensor("op_139"), val = tensor([1, 256, -1])]; tensor var_137_cast_fp16 = transpose(perm = var_137_perm_0, x = attn_output_2_cast_fp16)[name = tensor("transpose_104")]; tensor var_140_cast_fp16 = reshape(shape = var_139, x = var_137_cast_fp16)[name = tensor("op_140_cast_fp16")]; tensor encoder_layers_0_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(533113536)))]; tensor encoder_layers_0_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535210752)))]; tensor linear_3_cast_fp16 = linear(bias = encoder_layers_0_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_0_self_attn_out_proj_weight_to_fp16, x = var_140_cast_fp16)[name = tensor("linear_3_cast_fp16")]; tensor input2_1_cast_fp16 = add(x = input0_7_cast_fp16, y = linear_3_cast_fp16)[name = tensor("input2_1_cast_fp16")]; tensor input0_5_axes_0 = const()[name = tensor("input0_5_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_0_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535212864)))]; tensor encoder_layers_0_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_0_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535214976)))]; tensor input0_5_cast_fp16 = layer_norm(axes = input0_5_axes_0, beta = encoder_layers_0_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_0_final_layer_norm_weight_to_fp16, x = input2_1_cast_fp16)[name = tensor("input0_5_cast_fp16")]; tensor encoder_layers_0_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_0_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535217088)))]; tensor encoder_layers_0_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_0_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(543605760)))]; tensor linear_4_cast_fp16 = linear(bias = encoder_layers_0_fc1_bias_to_fp16, weight = encoder_layers_0_fc1_weight_to_fp16, x = input0_5_cast_fp16)[name = tensor("linear_4_cast_fp16")]; tensor var_154_cast_fp16 = relu(x = linear_4_cast_fp16)[name = tensor("op_154_cast_fp16")]; tensor encoder_layers_0_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_0_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(543614016)))]; tensor encoder_layers_0_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_0_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(552002688)))]; tensor linear_5_cast_fp16 = linear(bias = encoder_layers_0_fc2_bias_to_fp16, weight = encoder_layers_0_fc2_weight_to_fp16, x = var_154_cast_fp16)[name = tensor("linear_5_cast_fp16")]; tensor var_160_cast_fp16 = add(x = input2_1_cast_fp16, y = linear_5_cast_fp16)[name = tensor("op_160_cast_fp16")]; tensor hidden_states_7_axes_0 = const()[name = tensor("hidden_states_7_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(552004800)))]; tensor encoder_layers_1_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(552006912)))]; tensor hidden_states_7_cast_fp16 = layer_norm(axes = hidden_states_7_axes_0, beta = encoder_layers_1_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_1_self_attn_layer_norm_weight_to_fp16, x = var_160_cast_fp16)[name = tensor("hidden_states_7_cast_fp16")]; tensor encoder_layers_1_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(552009024)))]; tensor encoder_layers_1_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(554106240)))]; tensor linear_6_cast_fp16 = linear(bias = encoder_layers_1_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_1_self_attn_q_proj_weight_to_fp16, x = hidden_states_7_cast_fp16)[name = tensor("linear_6_cast_fp16")]; tensor var_179 = const()[name = tensor("op_179"), val = tensor([1, 256, -1, 64])]; tensor var_180_cast_fp16 = reshape(shape = var_179, x = linear_6_cast_fp16)[name = tensor("op_180_cast_fp16")]; tensor encoder_layers_1_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(554108352)))]; tensor encoder_layers_1_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(556205568)))]; tensor linear_7_cast_fp16 = linear(bias = encoder_layers_1_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_1_self_attn_k_proj_weight_to_fp16, x = hidden_states_7_cast_fp16)[name = tensor("linear_7_cast_fp16")]; tensor encoder_layers_1_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(556207680)))]; tensor encoder_layers_1_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(558304896)))]; tensor linear_8_cast_fp16 = linear(bias = encoder_layers_1_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_1_self_attn_v_proj_weight_to_fp16, x = hidden_states_7_cast_fp16)[name = tensor("linear_8_cast_fp16")]; tensor var_188 = const()[name = tensor("op_188"), val = tensor([1, 256, -1, 64])]; tensor var_189_cast_fp16 = reshape(shape = var_188, x = linear_7_cast_fp16)[name = tensor("op_189_cast_fp16")]; tensor var_191 = const()[name = tensor("op_191"), val = tensor([1, 256, -1, 64])]; tensor var_192_cast_fp16 = reshape(shape = var_191, x = linear_8_cast_fp16)[name = tensor("op_192_cast_fp16")]; tensor value_4_perm_0 = const()[name = tensor("value_4_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_195_transpose_x_0 = const()[name = tensor("op_195_transpose_x_0"), val = tensor(false)]; tensor var_195_transpose_y_0 = const()[name = tensor("op_195_transpose_y_0"), val = tensor(false)]; tensor transpose_38_perm_0 = const()[name = tensor("transpose_38_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_39_perm_0 = const()[name = tensor("transpose_39_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_39 = transpose(perm = transpose_39_perm_0, x = var_189_cast_fp16)[name = tensor("transpose_101")]; tensor transpose_38 = transpose(perm = transpose_38_perm_0, x = var_180_cast_fp16)[name = tensor("transpose_102")]; tensor var_195_cast_fp16 = matmul(transpose_x = var_195_transpose_x_0, transpose_y = var_195_transpose_y_0, x = transpose_38, y = transpose_39)[name = tensor("op_195_cast_fp16")]; tensor var_196_to_fp16 = const()[name = tensor("op_196_to_fp16"), val = tensor(0x1p-3)]; tensor attn_weights_4_cast_fp16 = mul(x = var_195_cast_fp16, y = var_196_to_fp16)[name = tensor("attn_weights_4_cast_fp16")]; tensor input_11_cast_fp16 = add(x = attn_weights_4_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor("input_11_cast_fp16")]; tensor input0_9_cast_fp16 = softmax(axis = var_18, x = input_11_cast_fp16)[name = tensor("input0_9_cast_fp16")]; tensor attn_output_4_transpose_x_0 = const()[name = tensor("attn_output_4_transpose_x_0"), val = tensor(false)]; tensor attn_output_4_transpose_y_0 = const()[name = tensor("attn_output_4_transpose_y_0"), val = tensor(false)]; tensor value_4_cast_fp16 = transpose(perm = value_4_perm_0, x = var_192_cast_fp16)[name = tensor("transpose_103")]; tensor attn_output_4_cast_fp16 = matmul(transpose_x = attn_output_4_transpose_x_0, transpose_y = attn_output_4_transpose_y_0, x = input0_9_cast_fp16, y = value_4_cast_fp16)[name = tensor("attn_output_4_cast_fp16")]; tensor var_202_perm_0 = const()[name = tensor("op_202_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_204 = const()[name = tensor("op_204"), val = tensor([1, 256, -1])]; tensor var_202_cast_fp16 = transpose(perm = var_202_perm_0, x = attn_output_4_cast_fp16)[name = tensor("transpose_100")]; tensor var_205_cast_fp16 = reshape(shape = var_204, x = var_202_cast_fp16)[name = tensor("op_205_cast_fp16")]; tensor encoder_layers_1_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(558307008)))]; tensor encoder_layers_1_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(560404224)))]; tensor linear_9_cast_fp16 = linear(bias = encoder_layers_1_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_1_self_attn_out_proj_weight_to_fp16, x = var_205_cast_fp16)[name = tensor("linear_9_cast_fp16")]; tensor input_13_cast_fp16 = add(x = var_160_cast_fp16, y = linear_9_cast_fp16)[name = tensor("input_13_cast_fp16")]; tensor input0_11_axes_0 = const()[name = tensor("input0_11_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_1_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(560406336)))]; tensor encoder_layers_1_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_1_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(560408448)))]; tensor input0_11_cast_fp16 = layer_norm(axes = input0_11_axes_0, beta = encoder_layers_1_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_1_final_layer_norm_weight_to_fp16, x = input_13_cast_fp16)[name = tensor("input0_11_cast_fp16")]; tensor encoder_layers_1_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_1_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(560410560)))]; tensor encoder_layers_1_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_1_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(568799232)))]; tensor linear_10_cast_fp16 = linear(bias = encoder_layers_1_fc1_bias_to_fp16, weight = encoder_layers_1_fc1_weight_to_fp16, x = input0_11_cast_fp16)[name = tensor("linear_10_cast_fp16")]; tensor var_219_cast_fp16 = relu(x = linear_10_cast_fp16)[name = tensor("op_219_cast_fp16")]; tensor encoder_layers_1_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_1_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(568807488)))]; tensor encoder_layers_1_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_1_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(577196160)))]; tensor linear_11_cast_fp16 = linear(bias = encoder_layers_1_fc2_bias_to_fp16, weight = encoder_layers_1_fc2_weight_to_fp16, x = var_219_cast_fp16)[name = tensor("linear_11_cast_fp16")]; tensor var_225_cast_fp16 = add(x = input_13_cast_fp16, y = linear_11_cast_fp16)[name = tensor("op_225_cast_fp16")]; tensor hidden_states_11_axes_0 = const()[name = tensor("hidden_states_11_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(577198272)))]; tensor encoder_layers_2_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(577200384)))]; tensor hidden_states_11_cast_fp16 = layer_norm(axes = hidden_states_11_axes_0, beta = encoder_layers_2_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_2_self_attn_layer_norm_weight_to_fp16, x = var_225_cast_fp16)[name = tensor("hidden_states_11_cast_fp16")]; tensor encoder_layers_2_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(577202496)))]; tensor encoder_layers_2_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(579299712)))]; tensor linear_12_cast_fp16 = linear(bias = encoder_layers_2_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_2_self_attn_q_proj_weight_to_fp16, x = hidden_states_11_cast_fp16)[name = tensor("linear_12_cast_fp16")]; tensor var_244 = const()[name = tensor("op_244"), val = tensor([1, 256, -1, 64])]; tensor var_245_cast_fp16 = reshape(shape = var_244, x = linear_12_cast_fp16)[name = tensor("op_245_cast_fp16")]; tensor encoder_layers_2_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(579301824)))]; tensor encoder_layers_2_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(581399040)))]; tensor linear_13_cast_fp16 = linear(bias = encoder_layers_2_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_2_self_attn_k_proj_weight_to_fp16, x = hidden_states_11_cast_fp16)[name = tensor("linear_13_cast_fp16")]; tensor encoder_layers_2_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(581401152)))]; tensor encoder_layers_2_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(583498368)))]; tensor linear_14_cast_fp16 = linear(bias = encoder_layers_2_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_2_self_attn_v_proj_weight_to_fp16, x = hidden_states_11_cast_fp16)[name = tensor("linear_14_cast_fp16")]; tensor var_253 = const()[name = tensor("op_253"), val = tensor([1, 256, -1, 64])]; tensor var_254_cast_fp16 = reshape(shape = var_253, x = linear_13_cast_fp16)[name = tensor("op_254_cast_fp16")]; tensor var_256 = const()[name = tensor("op_256"), val = tensor([1, 256, -1, 64])]; tensor var_257_cast_fp16 = reshape(shape = var_256, x = linear_14_cast_fp16)[name = tensor("op_257_cast_fp16")]; tensor value_6_perm_0 = const()[name = tensor("value_6_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_260_transpose_x_0 = const()[name = tensor("op_260_transpose_x_0"), val = tensor(false)]; tensor var_260_transpose_y_0 = const()[name = tensor("op_260_transpose_y_0"), val = tensor(false)]; tensor transpose_40_perm_0 = const()[name = tensor("transpose_40_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_41_perm_0 = const()[name = tensor("transpose_41_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_41 = transpose(perm = transpose_41_perm_0, x = var_254_cast_fp16)[name = tensor("transpose_97")]; tensor transpose_40 = transpose(perm = transpose_40_perm_0, x = var_245_cast_fp16)[name = tensor("transpose_98")]; tensor var_260_cast_fp16 = matmul(transpose_x = var_260_transpose_x_0, transpose_y = var_260_transpose_y_0, x = transpose_40, y = transpose_41)[name = tensor("op_260_cast_fp16")]; tensor var_261_to_fp16 = const()[name = tensor("op_261_to_fp16"), val = tensor(0x1p-3)]; tensor attn_weights_6_cast_fp16 = mul(x = var_260_cast_fp16, y = var_261_to_fp16)[name = tensor("attn_weights_6_cast_fp16")]; tensor input_17_cast_fp16 = add(x = attn_weights_6_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor("input_17_cast_fp16")]; tensor input0_15_cast_fp16 = softmax(axis = var_18, x = input_17_cast_fp16)[name = tensor("input0_15_cast_fp16")]; tensor attn_output_6_transpose_x_0 = const()[name = tensor("attn_output_6_transpose_x_0"), val = tensor(false)]; tensor attn_output_6_transpose_y_0 = const()[name = tensor("attn_output_6_transpose_y_0"), val = tensor(false)]; tensor value_6_cast_fp16 = transpose(perm = value_6_perm_0, x = var_257_cast_fp16)[name = tensor("transpose_99")]; tensor attn_output_6_cast_fp16 = matmul(transpose_x = attn_output_6_transpose_x_0, transpose_y = attn_output_6_transpose_y_0, x = input0_15_cast_fp16, y = value_6_cast_fp16)[name = tensor("attn_output_6_cast_fp16")]; tensor var_267_perm_0 = const()[name = tensor("op_267_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_269 = const()[name = tensor("op_269"), val = tensor([1, 256, -1])]; tensor var_267_cast_fp16 = transpose(perm = var_267_perm_0, x = attn_output_6_cast_fp16)[name = tensor("transpose_96")]; tensor var_270_cast_fp16 = reshape(shape = var_269, x = var_267_cast_fp16)[name = tensor("op_270_cast_fp16")]; tensor encoder_layers_2_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(583500480)))]; tensor encoder_layers_2_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(585597696)))]; tensor linear_15_cast_fp16 = linear(bias = encoder_layers_2_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_2_self_attn_out_proj_weight_to_fp16, x = var_270_cast_fp16)[name = tensor("linear_15_cast_fp16")]; tensor input_19_cast_fp16 = add(x = var_225_cast_fp16, y = linear_15_cast_fp16)[name = tensor("input_19_cast_fp16")]; tensor input0_17_axes_0 = const()[name = tensor("input0_17_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_2_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(585599808)))]; tensor encoder_layers_2_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_2_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(585601920)))]; tensor input0_17_cast_fp16 = layer_norm(axes = input0_17_axes_0, beta = encoder_layers_2_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_2_final_layer_norm_weight_to_fp16, x = input_19_cast_fp16)[name = tensor("input0_17_cast_fp16")]; tensor encoder_layers_2_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_2_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(585604032)))]; tensor encoder_layers_2_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_2_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(593992704)))]; tensor linear_16_cast_fp16 = linear(bias = encoder_layers_2_fc1_bias_to_fp16, weight = encoder_layers_2_fc1_weight_to_fp16, x = input0_17_cast_fp16)[name = tensor("linear_16_cast_fp16")]; tensor var_284_cast_fp16 = relu(x = linear_16_cast_fp16)[name = tensor("op_284_cast_fp16")]; tensor encoder_layers_2_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_2_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(594000960)))]; tensor encoder_layers_2_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_2_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(602389632)))]; tensor linear_17_cast_fp16 = linear(bias = encoder_layers_2_fc2_bias_to_fp16, weight = encoder_layers_2_fc2_weight_to_fp16, x = var_284_cast_fp16)[name = tensor("linear_17_cast_fp16")]; tensor var_290_cast_fp16 = add(x = input_19_cast_fp16, y = linear_17_cast_fp16)[name = tensor("op_290_cast_fp16")]; tensor hidden_states_15_axes_0 = const()[name = tensor("hidden_states_15_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(602391744)))]; tensor encoder_layers_3_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(602393856)))]; tensor hidden_states_15_cast_fp16 = layer_norm(axes = hidden_states_15_axes_0, beta = encoder_layers_3_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_3_self_attn_layer_norm_weight_to_fp16, x = var_290_cast_fp16)[name = tensor("hidden_states_15_cast_fp16")]; tensor encoder_layers_3_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(602395968)))]; tensor encoder_layers_3_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604493184)))]; tensor linear_18_cast_fp16 = linear(bias = encoder_layers_3_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_3_self_attn_q_proj_weight_to_fp16, x = hidden_states_15_cast_fp16)[name = tensor("linear_18_cast_fp16")]; tensor var_309 = const()[name = tensor("op_309"), val = tensor([1, 256, -1, 64])]; tensor var_310_cast_fp16 = reshape(shape = var_309, x = linear_18_cast_fp16)[name = tensor("op_310_cast_fp16")]; tensor encoder_layers_3_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604495296)))]; tensor encoder_layers_3_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(606592512)))]; tensor linear_19_cast_fp16 = linear(bias = encoder_layers_3_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_3_self_attn_k_proj_weight_to_fp16, x = hidden_states_15_cast_fp16)[name = tensor("linear_19_cast_fp16")]; tensor encoder_layers_3_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(606594624)))]; tensor encoder_layers_3_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(608691840)))]; tensor linear_20_cast_fp16 = linear(bias = encoder_layers_3_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_3_self_attn_v_proj_weight_to_fp16, x = hidden_states_15_cast_fp16)[name = tensor("linear_20_cast_fp16")]; tensor var_318 = const()[name = tensor("op_318"), val = tensor([1, 256, -1, 64])]; tensor var_319_cast_fp16 = reshape(shape = var_318, x = linear_19_cast_fp16)[name = tensor("op_319_cast_fp16")]; tensor var_321 = const()[name = tensor("op_321"), val = tensor([1, 256, -1, 64])]; tensor var_322_cast_fp16 = reshape(shape = var_321, x = linear_20_cast_fp16)[name = tensor("op_322_cast_fp16")]; tensor value_8_perm_0 = const()[name = tensor("value_8_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_325_transpose_x_0 = const()[name = tensor("op_325_transpose_x_0"), val = tensor(false)]; tensor var_325_transpose_y_0 = const()[name = tensor("op_325_transpose_y_0"), val = tensor(false)]; tensor transpose_42_perm_0 = const()[name = tensor("transpose_42_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_43_perm_0 = const()[name = tensor("transpose_43_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_43 = transpose(perm = transpose_43_perm_0, x = var_319_cast_fp16)[name = tensor("transpose_93")]; tensor transpose_42 = transpose(perm = transpose_42_perm_0, x = var_310_cast_fp16)[name = tensor("transpose_94")]; tensor var_325_cast_fp16 = matmul(transpose_x = var_325_transpose_x_0, transpose_y = var_325_transpose_y_0, x = transpose_42, y = transpose_43)[name = tensor("op_325_cast_fp16")]; tensor var_326_to_fp16 = const()[name = tensor("op_326_to_fp16"), val = tensor(0x1p-3)]; tensor attn_weights_8_cast_fp16 = mul(x = var_325_cast_fp16, y = var_326_to_fp16)[name = tensor("attn_weights_8_cast_fp16")]; tensor input_23_cast_fp16 = add(x = attn_weights_8_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor("input_23_cast_fp16")]; tensor input0_21_cast_fp16 = softmax(axis = var_18, x = input_23_cast_fp16)[name = tensor("input0_21_cast_fp16")]; tensor attn_output_8_transpose_x_0 = const()[name = tensor("attn_output_8_transpose_x_0"), val = tensor(false)]; tensor attn_output_8_transpose_y_0 = const()[name = tensor("attn_output_8_transpose_y_0"), val = tensor(false)]; tensor value_8_cast_fp16 = transpose(perm = value_8_perm_0, x = var_322_cast_fp16)[name = tensor("transpose_95")]; tensor attn_output_8_cast_fp16 = matmul(transpose_x = attn_output_8_transpose_x_0, transpose_y = attn_output_8_transpose_y_0, x = input0_21_cast_fp16, y = value_8_cast_fp16)[name = tensor("attn_output_8_cast_fp16")]; tensor var_332_perm_0 = const()[name = tensor("op_332_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_334 = const()[name = tensor("op_334"), val = tensor([1, 256, -1])]; tensor var_332_cast_fp16 = transpose(perm = var_332_perm_0, x = attn_output_8_cast_fp16)[name = tensor("transpose_92")]; tensor var_335_cast_fp16 = reshape(shape = var_334, x = var_332_cast_fp16)[name = tensor("op_335_cast_fp16")]; tensor encoder_layers_3_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(608693952)))]; tensor encoder_layers_3_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(610791168)))]; tensor linear_21_cast_fp16 = linear(bias = encoder_layers_3_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_3_self_attn_out_proj_weight_to_fp16, x = var_335_cast_fp16)[name = tensor("linear_21_cast_fp16")]; tensor input_25_cast_fp16 = add(x = var_290_cast_fp16, y = linear_21_cast_fp16)[name = tensor("input_25_cast_fp16")]; tensor input0_23_axes_0 = const()[name = tensor("input0_23_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_3_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(610793280)))]; tensor encoder_layers_3_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_3_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(610795392)))]; tensor input0_23_cast_fp16 = layer_norm(axes = input0_23_axes_0, beta = encoder_layers_3_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_3_final_layer_norm_weight_to_fp16, x = input_25_cast_fp16)[name = tensor("input0_23_cast_fp16")]; tensor encoder_layers_3_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_3_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(610797504)))]; tensor encoder_layers_3_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_3_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(619186176)))]; tensor linear_22_cast_fp16 = linear(bias = encoder_layers_3_fc1_bias_to_fp16, weight = encoder_layers_3_fc1_weight_to_fp16, x = input0_23_cast_fp16)[name = tensor("linear_22_cast_fp16")]; tensor var_349_cast_fp16 = relu(x = linear_22_cast_fp16)[name = tensor("op_349_cast_fp16")]; tensor encoder_layers_3_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_3_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(619194432)))]; tensor encoder_layers_3_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_3_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(627583104)))]; tensor linear_23_cast_fp16 = linear(bias = encoder_layers_3_fc2_bias_to_fp16, weight = encoder_layers_3_fc2_weight_to_fp16, x = var_349_cast_fp16)[name = tensor("linear_23_cast_fp16")]; tensor var_355_cast_fp16 = add(x = input_25_cast_fp16, y = linear_23_cast_fp16)[name = tensor("op_355_cast_fp16")]; tensor hidden_states_19_axes_0 = const()[name = tensor("hidden_states_19_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(627585216)))]; tensor encoder_layers_4_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(627587328)))]; tensor hidden_states_19_cast_fp16 = layer_norm(axes = hidden_states_19_axes_0, beta = encoder_layers_4_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_4_self_attn_layer_norm_weight_to_fp16, x = var_355_cast_fp16)[name = tensor("hidden_states_19_cast_fp16")]; tensor encoder_layers_4_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(627589440)))]; tensor encoder_layers_4_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(629686656)))]; tensor linear_24_cast_fp16 = linear(bias = encoder_layers_4_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_4_self_attn_q_proj_weight_to_fp16, x = hidden_states_19_cast_fp16)[name = tensor("linear_24_cast_fp16")]; tensor var_374 = const()[name = tensor("op_374"), val = tensor([1, 256, -1, 64])]; tensor var_375_cast_fp16 = reshape(shape = var_374, x = linear_24_cast_fp16)[name = tensor("op_375_cast_fp16")]; tensor encoder_layers_4_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(629688768)))]; tensor encoder_layers_4_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(631785984)))]; tensor linear_25_cast_fp16 = linear(bias = encoder_layers_4_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_4_self_attn_k_proj_weight_to_fp16, x = hidden_states_19_cast_fp16)[name = tensor("linear_25_cast_fp16")]; tensor encoder_layers_4_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(631788096)))]; tensor encoder_layers_4_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(633885312)))]; tensor linear_26_cast_fp16 = linear(bias = encoder_layers_4_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_4_self_attn_v_proj_weight_to_fp16, x = hidden_states_19_cast_fp16)[name = tensor("linear_26_cast_fp16")]; tensor var_383 = const()[name = tensor("op_383"), val = tensor([1, 256, -1, 64])]; tensor var_384_cast_fp16 = reshape(shape = var_383, x = linear_25_cast_fp16)[name = tensor("op_384_cast_fp16")]; tensor var_386 = const()[name = tensor("op_386"), val = tensor([1, 256, -1, 64])]; tensor var_387_cast_fp16 = reshape(shape = var_386, x = linear_26_cast_fp16)[name = tensor("op_387_cast_fp16")]; tensor value_10_perm_0 = const()[name = tensor("value_10_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_390_transpose_x_0 = const()[name = tensor("op_390_transpose_x_0"), val = tensor(false)]; tensor var_390_transpose_y_0 = const()[name = tensor("op_390_transpose_y_0"), val = tensor(false)]; tensor transpose_44_perm_0 = const()[name = tensor("transpose_44_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_45_perm_0 = const()[name = tensor("transpose_45_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_45 = transpose(perm = transpose_45_perm_0, x = var_384_cast_fp16)[name = tensor("transpose_89")]; tensor transpose_44 = transpose(perm = transpose_44_perm_0, x = var_375_cast_fp16)[name = tensor("transpose_90")]; tensor var_390_cast_fp16 = matmul(transpose_x = var_390_transpose_x_0, transpose_y = var_390_transpose_y_0, x = transpose_44, y = transpose_45)[name = tensor("op_390_cast_fp16")]; tensor var_391_to_fp16 = const()[name = tensor("op_391_to_fp16"), val = tensor(0x1p-3)]; tensor attn_weights_10_cast_fp16 = mul(x = var_390_cast_fp16, y = var_391_to_fp16)[name = tensor("attn_weights_10_cast_fp16")]; tensor input_29_cast_fp16 = add(x = attn_weights_10_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor("input_29_cast_fp16")]; tensor input0_27_cast_fp16 = softmax(axis = var_18, x = input_29_cast_fp16)[name = tensor("input0_27_cast_fp16")]; tensor attn_output_10_transpose_x_0 = const()[name = tensor("attn_output_10_transpose_x_0"), val = tensor(false)]; tensor attn_output_10_transpose_y_0 = const()[name = tensor("attn_output_10_transpose_y_0"), val = tensor(false)]; tensor value_10_cast_fp16 = transpose(perm = value_10_perm_0, x = var_387_cast_fp16)[name = tensor("transpose_91")]; tensor attn_output_10_cast_fp16 = matmul(transpose_x = attn_output_10_transpose_x_0, transpose_y = attn_output_10_transpose_y_0, x = input0_27_cast_fp16, y = value_10_cast_fp16)[name = tensor("attn_output_10_cast_fp16")]; tensor var_397_perm_0 = const()[name = tensor("op_397_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_399 = const()[name = tensor("op_399"), val = tensor([1, 256, -1])]; tensor var_397_cast_fp16 = transpose(perm = var_397_perm_0, x = attn_output_10_cast_fp16)[name = tensor("transpose_88")]; tensor var_400_cast_fp16 = reshape(shape = var_399, x = var_397_cast_fp16)[name = tensor("op_400_cast_fp16")]; tensor encoder_layers_4_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(633887424)))]; tensor encoder_layers_4_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(635984640)))]; tensor linear_27_cast_fp16 = linear(bias = encoder_layers_4_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_4_self_attn_out_proj_weight_to_fp16, x = var_400_cast_fp16)[name = tensor("linear_27_cast_fp16")]; tensor input_31_cast_fp16 = add(x = var_355_cast_fp16, y = linear_27_cast_fp16)[name = tensor("input_31_cast_fp16")]; tensor input0_29_axes_0 = const()[name = tensor("input0_29_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_4_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(635986752)))]; tensor encoder_layers_4_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_4_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(635988864)))]; tensor input0_29_cast_fp16 = layer_norm(axes = input0_29_axes_0, beta = encoder_layers_4_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_4_final_layer_norm_weight_to_fp16, x = input_31_cast_fp16)[name = tensor("input0_29_cast_fp16")]; tensor encoder_layers_4_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_4_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(635990976)))]; tensor encoder_layers_4_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_4_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644379648)))]; tensor linear_28_cast_fp16 = linear(bias = encoder_layers_4_fc1_bias_to_fp16, weight = encoder_layers_4_fc1_weight_to_fp16, x = input0_29_cast_fp16)[name = tensor("linear_28_cast_fp16")]; tensor var_414_cast_fp16 = relu(x = linear_28_cast_fp16)[name = tensor("op_414_cast_fp16")]; tensor encoder_layers_4_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_4_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644387904)))]; tensor encoder_layers_4_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_4_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(652776576)))]; tensor linear_29_cast_fp16 = linear(bias = encoder_layers_4_fc2_bias_to_fp16, weight = encoder_layers_4_fc2_weight_to_fp16, x = var_414_cast_fp16)[name = tensor("linear_29_cast_fp16")]; tensor var_420_cast_fp16 = add(x = input_31_cast_fp16, y = linear_29_cast_fp16)[name = tensor("op_420_cast_fp16")]; tensor hidden_states_23_axes_0 = const()[name = tensor("hidden_states_23_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(652778688)))]; tensor encoder_layers_5_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(652780800)))]; tensor hidden_states_23_cast_fp16 = layer_norm(axes = hidden_states_23_axes_0, beta = encoder_layers_5_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_5_self_attn_layer_norm_weight_to_fp16, x = var_420_cast_fp16)[name = tensor("hidden_states_23_cast_fp16")]; tensor encoder_layers_5_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(652782912)))]; tensor encoder_layers_5_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(654880128)))]; tensor linear_30_cast_fp16 = linear(bias = encoder_layers_5_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_5_self_attn_q_proj_weight_to_fp16, x = hidden_states_23_cast_fp16)[name = tensor("linear_30_cast_fp16")]; tensor var_439 = const()[name = tensor("op_439"), val = tensor([1, 256, -1, 64])]; tensor var_440_cast_fp16 = reshape(shape = var_439, x = linear_30_cast_fp16)[name = tensor("op_440_cast_fp16")]; tensor encoder_layers_5_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(654882240)))]; tensor encoder_layers_5_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(656979456)))]; tensor linear_31_cast_fp16 = linear(bias = encoder_layers_5_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_5_self_attn_k_proj_weight_to_fp16, x = hidden_states_23_cast_fp16)[name = tensor("linear_31_cast_fp16")]; tensor encoder_layers_5_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(656981568)))]; tensor encoder_layers_5_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(659078784)))]; tensor linear_32_cast_fp16 = linear(bias = encoder_layers_5_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_5_self_attn_v_proj_weight_to_fp16, x = hidden_states_23_cast_fp16)[name = tensor("linear_32_cast_fp16")]; tensor var_448 = const()[name = tensor("op_448"), val = tensor([1, 256, -1, 64])]; tensor var_449_cast_fp16 = reshape(shape = var_448, x = linear_31_cast_fp16)[name = tensor("op_449_cast_fp16")]; tensor var_451 = const()[name = tensor("op_451"), val = tensor([1, 256, -1, 64])]; tensor var_452_cast_fp16 = reshape(shape = var_451, x = linear_32_cast_fp16)[name = tensor("op_452_cast_fp16")]; tensor value_12_perm_0 = const()[name = tensor("value_12_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_455_transpose_x_0 = const()[name = tensor("op_455_transpose_x_0"), val = tensor(false)]; tensor var_455_transpose_y_0 = const()[name = tensor("op_455_transpose_y_0"), val = tensor(false)]; tensor transpose_46_perm_0 = const()[name = tensor("transpose_46_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_47_perm_0 = const()[name = tensor("transpose_47_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_47 = transpose(perm = transpose_47_perm_0, x = var_449_cast_fp16)[name = tensor("transpose_85")]; tensor transpose_46 = transpose(perm = transpose_46_perm_0, x = var_440_cast_fp16)[name = tensor("transpose_86")]; tensor var_455_cast_fp16 = matmul(transpose_x = var_455_transpose_x_0, transpose_y = var_455_transpose_y_0, x = transpose_46, y = transpose_47)[name = tensor("op_455_cast_fp16")]; tensor var_456_to_fp16 = const()[name = tensor("op_456_to_fp16"), val = tensor(0x1p-3)]; tensor attn_weights_12_cast_fp16 = mul(x = var_455_cast_fp16, y = var_456_to_fp16)[name = tensor("attn_weights_12_cast_fp16")]; tensor input_35_cast_fp16 = add(x = attn_weights_12_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor("input_35_cast_fp16")]; tensor input0_33_cast_fp16 = softmax(axis = var_18, x = input_35_cast_fp16)[name = tensor("input0_33_cast_fp16")]; tensor attn_output_12_transpose_x_0 = const()[name = tensor("attn_output_12_transpose_x_0"), val = tensor(false)]; tensor attn_output_12_transpose_y_0 = const()[name = tensor("attn_output_12_transpose_y_0"), val = tensor(false)]; tensor value_12_cast_fp16 = transpose(perm = value_12_perm_0, x = var_452_cast_fp16)[name = tensor("transpose_87")]; tensor attn_output_12_cast_fp16 = matmul(transpose_x = attn_output_12_transpose_x_0, transpose_y = attn_output_12_transpose_y_0, x = input0_33_cast_fp16, y = value_12_cast_fp16)[name = tensor("attn_output_12_cast_fp16")]; tensor var_462_perm_0 = const()[name = tensor("op_462_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_464 = const()[name = tensor("op_464"), val = tensor([1, 256, -1])]; tensor var_462_cast_fp16 = transpose(perm = var_462_perm_0, x = attn_output_12_cast_fp16)[name = tensor("transpose_84")]; tensor var_465_cast_fp16 = reshape(shape = var_464, x = var_462_cast_fp16)[name = tensor("op_465_cast_fp16")]; tensor encoder_layers_5_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(659080896)))]; tensor encoder_layers_5_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(661178112)))]; tensor linear_33_cast_fp16 = linear(bias = encoder_layers_5_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_5_self_attn_out_proj_weight_to_fp16, x = var_465_cast_fp16)[name = tensor("linear_33_cast_fp16")]; tensor input_37_cast_fp16 = add(x = var_420_cast_fp16, y = linear_33_cast_fp16)[name = tensor("input_37_cast_fp16")]; tensor input0_35_axes_0 = const()[name = tensor("input0_35_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_5_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(661180224)))]; tensor encoder_layers_5_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_5_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(661182336)))]; tensor input0_35_cast_fp16 = layer_norm(axes = input0_35_axes_0, beta = encoder_layers_5_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_5_final_layer_norm_weight_to_fp16, x = input_37_cast_fp16)[name = tensor("input0_35_cast_fp16")]; tensor encoder_layers_5_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_5_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(661184448)))]; tensor encoder_layers_5_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_5_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(669573120)))]; tensor linear_34_cast_fp16 = linear(bias = encoder_layers_5_fc1_bias_to_fp16, weight = encoder_layers_5_fc1_weight_to_fp16, x = input0_35_cast_fp16)[name = tensor("linear_34_cast_fp16")]; tensor var_479_cast_fp16 = relu(x = linear_34_cast_fp16)[name = tensor("op_479_cast_fp16")]; tensor encoder_layers_5_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_5_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(669581376)))]; tensor encoder_layers_5_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_5_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(677970048)))]; tensor linear_35_cast_fp16 = linear(bias = encoder_layers_5_fc2_bias_to_fp16, weight = encoder_layers_5_fc2_weight_to_fp16, x = var_479_cast_fp16)[name = tensor("linear_35_cast_fp16")]; tensor var_485_cast_fp16 = add(x = input_37_cast_fp16, y = linear_35_cast_fp16)[name = tensor("op_485_cast_fp16")]; tensor hidden_states_27_axes_0 = const()[name = tensor("hidden_states_27_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(677972160)))]; tensor encoder_layers_6_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(677974272)))]; tensor hidden_states_27_cast_fp16 = layer_norm(axes = hidden_states_27_axes_0, beta = encoder_layers_6_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_6_self_attn_layer_norm_weight_to_fp16, x = var_485_cast_fp16)[name = tensor("hidden_states_27_cast_fp16")]; tensor encoder_layers_6_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(677976384)))]; tensor encoder_layers_6_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(680073600)))]; tensor linear_36_cast_fp16 = linear(bias = encoder_layers_6_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_6_self_attn_q_proj_weight_to_fp16, x = hidden_states_27_cast_fp16)[name = tensor("linear_36_cast_fp16")]; tensor var_504 = const()[name = tensor("op_504"), val = tensor([1, 256, -1, 64])]; tensor var_505_cast_fp16 = reshape(shape = var_504, x = linear_36_cast_fp16)[name = tensor("op_505_cast_fp16")]; tensor encoder_layers_6_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(680075712)))]; tensor encoder_layers_6_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(682172928)))]; tensor linear_37_cast_fp16 = linear(bias = encoder_layers_6_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_6_self_attn_k_proj_weight_to_fp16, x = hidden_states_27_cast_fp16)[name = tensor("linear_37_cast_fp16")]; tensor encoder_layers_6_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(682175040)))]; tensor encoder_layers_6_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(684272256)))]; tensor linear_38_cast_fp16 = linear(bias = encoder_layers_6_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_6_self_attn_v_proj_weight_to_fp16, x = hidden_states_27_cast_fp16)[name = tensor("linear_38_cast_fp16")]; tensor var_513 = const()[name = tensor("op_513"), val = tensor([1, 256, -1, 64])]; tensor var_514_cast_fp16 = reshape(shape = var_513, x = linear_37_cast_fp16)[name = tensor("op_514_cast_fp16")]; tensor var_516 = const()[name = tensor("op_516"), val = tensor([1, 256, -1, 64])]; tensor var_517_cast_fp16 = reshape(shape = var_516, x = linear_38_cast_fp16)[name = tensor("op_517_cast_fp16")]; tensor value_14_perm_0 = const()[name = tensor("value_14_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_520_transpose_x_0 = const()[name = tensor("op_520_transpose_x_0"), val = tensor(false)]; tensor var_520_transpose_y_0 = const()[name = tensor("op_520_transpose_y_0"), val = tensor(false)]; tensor transpose_48_perm_0 = const()[name = tensor("transpose_48_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_49_perm_0 = const()[name = tensor("transpose_49_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_49 = transpose(perm = transpose_49_perm_0, x = var_514_cast_fp16)[name = tensor("transpose_81")]; tensor transpose_48 = transpose(perm = transpose_48_perm_0, x = var_505_cast_fp16)[name = tensor("transpose_82")]; tensor var_520_cast_fp16 = matmul(transpose_x = var_520_transpose_x_0, transpose_y = var_520_transpose_y_0, x = transpose_48, y = transpose_49)[name = tensor("op_520_cast_fp16")]; tensor var_521_to_fp16 = const()[name = tensor("op_521_to_fp16"), val = tensor(0x1p-3)]; tensor attn_weights_14_cast_fp16 = mul(x = var_520_cast_fp16, y = var_521_to_fp16)[name = tensor("attn_weights_14_cast_fp16")]; tensor input_41_cast_fp16 = add(x = attn_weights_14_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor("input_41_cast_fp16")]; tensor input0_39_cast_fp16 = softmax(axis = var_18, x = input_41_cast_fp16)[name = tensor("input0_39_cast_fp16")]; tensor attn_output_14_transpose_x_0 = const()[name = tensor("attn_output_14_transpose_x_0"), val = tensor(false)]; tensor attn_output_14_transpose_y_0 = const()[name = tensor("attn_output_14_transpose_y_0"), val = tensor(false)]; tensor value_14_cast_fp16 = transpose(perm = value_14_perm_0, x = var_517_cast_fp16)[name = tensor("transpose_83")]; tensor attn_output_14_cast_fp16 = matmul(transpose_x = attn_output_14_transpose_x_0, transpose_y = attn_output_14_transpose_y_0, x = input0_39_cast_fp16, y = value_14_cast_fp16)[name = tensor("attn_output_14_cast_fp16")]; tensor var_527_perm_0 = const()[name = tensor("op_527_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_529 = const()[name = tensor("op_529"), val = tensor([1, 256, -1])]; tensor var_527_cast_fp16 = transpose(perm = var_527_perm_0, x = attn_output_14_cast_fp16)[name = tensor("transpose_80")]; tensor var_530_cast_fp16 = reshape(shape = var_529, x = var_527_cast_fp16)[name = tensor("op_530_cast_fp16")]; tensor encoder_layers_6_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(684274368)))]; tensor encoder_layers_6_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(686371584)))]; tensor linear_39_cast_fp16 = linear(bias = encoder_layers_6_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_6_self_attn_out_proj_weight_to_fp16, x = var_530_cast_fp16)[name = tensor("linear_39_cast_fp16")]; tensor input_43_cast_fp16 = add(x = var_485_cast_fp16, y = linear_39_cast_fp16)[name = tensor("input_43_cast_fp16")]; tensor input0_41_axes_0 = const()[name = tensor("input0_41_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_6_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(686373696)))]; tensor encoder_layers_6_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_6_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(686375808)))]; tensor input0_41_cast_fp16 = layer_norm(axes = input0_41_axes_0, beta = encoder_layers_6_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_6_final_layer_norm_weight_to_fp16, x = input_43_cast_fp16)[name = tensor("input0_41_cast_fp16")]; tensor encoder_layers_6_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_6_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(686377920)))]; tensor encoder_layers_6_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_6_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(694766592)))]; tensor linear_40_cast_fp16 = linear(bias = encoder_layers_6_fc1_bias_to_fp16, weight = encoder_layers_6_fc1_weight_to_fp16, x = input0_41_cast_fp16)[name = tensor("linear_40_cast_fp16")]; tensor var_544_cast_fp16 = relu(x = linear_40_cast_fp16)[name = tensor("op_544_cast_fp16")]; tensor encoder_layers_6_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_6_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(694774848)))]; tensor encoder_layers_6_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_6_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703163520)))]; tensor linear_41_cast_fp16 = linear(bias = encoder_layers_6_fc2_bias_to_fp16, weight = encoder_layers_6_fc2_weight_to_fp16, x = var_544_cast_fp16)[name = tensor("linear_41_cast_fp16")]; tensor var_550_cast_fp16 = add(x = input_43_cast_fp16, y = linear_41_cast_fp16)[name = tensor("op_550_cast_fp16")]; tensor hidden_states_31_axes_0 = const()[name = tensor("hidden_states_31_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703165632)))]; tensor encoder_layers_7_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703167744)))]; tensor hidden_states_31_cast_fp16 = layer_norm(axes = hidden_states_31_axes_0, beta = encoder_layers_7_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_7_self_attn_layer_norm_weight_to_fp16, x = var_550_cast_fp16)[name = tensor("hidden_states_31_cast_fp16")]; tensor encoder_layers_7_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703169856)))]; tensor encoder_layers_7_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(705267072)))]; tensor linear_42_cast_fp16 = linear(bias = encoder_layers_7_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_7_self_attn_q_proj_weight_to_fp16, x = hidden_states_31_cast_fp16)[name = tensor("linear_42_cast_fp16")]; tensor var_569 = const()[name = tensor("op_569"), val = tensor([1, 256, -1, 64])]; tensor var_570_cast_fp16 = reshape(shape = var_569, x = linear_42_cast_fp16)[name = tensor("op_570_cast_fp16")]; tensor encoder_layers_7_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(705269184)))]; tensor encoder_layers_7_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(707366400)))]; tensor linear_43_cast_fp16 = linear(bias = encoder_layers_7_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_7_self_attn_k_proj_weight_to_fp16, x = hidden_states_31_cast_fp16)[name = tensor("linear_43_cast_fp16")]; tensor encoder_layers_7_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(707368512)))]; tensor encoder_layers_7_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(709465728)))]; tensor linear_44_cast_fp16 = linear(bias = encoder_layers_7_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_7_self_attn_v_proj_weight_to_fp16, x = hidden_states_31_cast_fp16)[name = tensor("linear_44_cast_fp16")]; tensor var_578 = const()[name = tensor("op_578"), val = tensor([1, 256, -1, 64])]; tensor var_579_cast_fp16 = reshape(shape = var_578, x = linear_43_cast_fp16)[name = tensor("op_579_cast_fp16")]; tensor var_581 = const()[name = tensor("op_581"), val = tensor([1, 256, -1, 64])]; tensor var_582_cast_fp16 = reshape(shape = var_581, x = linear_44_cast_fp16)[name = tensor("op_582_cast_fp16")]; tensor value_16_perm_0 = const()[name = tensor("value_16_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_585_transpose_x_0 = const()[name = tensor("op_585_transpose_x_0"), val = tensor(false)]; tensor var_585_transpose_y_0 = const()[name = tensor("op_585_transpose_y_0"), val = tensor(false)]; tensor transpose_50_perm_0 = const()[name = tensor("transpose_50_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_51_perm_0 = const()[name = tensor("transpose_51_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_51 = transpose(perm = transpose_51_perm_0, x = var_579_cast_fp16)[name = tensor("transpose_77")]; tensor transpose_50 = transpose(perm = transpose_50_perm_0, x = var_570_cast_fp16)[name = tensor("transpose_78")]; tensor var_585_cast_fp16 = matmul(transpose_x = var_585_transpose_x_0, transpose_y = var_585_transpose_y_0, x = transpose_50, y = transpose_51)[name = tensor("op_585_cast_fp16")]; tensor var_586_to_fp16 = const()[name = tensor("op_586_to_fp16"), val = tensor(0x1p-3)]; tensor attn_weights_16_cast_fp16 = mul(x = var_585_cast_fp16, y = var_586_to_fp16)[name = tensor("attn_weights_16_cast_fp16")]; tensor input_47_cast_fp16 = add(x = attn_weights_16_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor("input_47_cast_fp16")]; tensor input0_45_cast_fp16 = softmax(axis = var_18, x = input_47_cast_fp16)[name = tensor("input0_45_cast_fp16")]; tensor attn_output_16_transpose_x_0 = const()[name = tensor("attn_output_16_transpose_x_0"), val = tensor(false)]; tensor attn_output_16_transpose_y_0 = const()[name = tensor("attn_output_16_transpose_y_0"), val = tensor(false)]; tensor value_16_cast_fp16 = transpose(perm = value_16_perm_0, x = var_582_cast_fp16)[name = tensor("transpose_79")]; tensor attn_output_16_cast_fp16 = matmul(transpose_x = attn_output_16_transpose_x_0, transpose_y = attn_output_16_transpose_y_0, x = input0_45_cast_fp16, y = value_16_cast_fp16)[name = tensor("attn_output_16_cast_fp16")]; tensor var_592_perm_0 = const()[name = tensor("op_592_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_594 = const()[name = tensor("op_594"), val = tensor([1, 256, -1])]; tensor var_592_cast_fp16 = transpose(perm = var_592_perm_0, x = attn_output_16_cast_fp16)[name = tensor("transpose_76")]; tensor var_595_cast_fp16 = reshape(shape = var_594, x = var_592_cast_fp16)[name = tensor("op_595_cast_fp16")]; tensor encoder_layers_7_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(709467840)))]; tensor encoder_layers_7_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(711565056)))]; tensor linear_45_cast_fp16 = linear(bias = encoder_layers_7_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_7_self_attn_out_proj_weight_to_fp16, x = var_595_cast_fp16)[name = tensor("linear_45_cast_fp16")]; tensor input_49_cast_fp16 = add(x = var_550_cast_fp16, y = linear_45_cast_fp16)[name = tensor("input_49_cast_fp16")]; tensor input0_47_axes_0 = const()[name = tensor("input0_47_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_7_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(711567168)))]; tensor encoder_layers_7_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_7_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(711569280)))]; tensor input0_47_cast_fp16 = layer_norm(axes = input0_47_axes_0, beta = encoder_layers_7_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_7_final_layer_norm_weight_to_fp16, x = input_49_cast_fp16)[name = tensor("input0_47_cast_fp16")]; tensor encoder_layers_7_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_7_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(711571392)))]; tensor encoder_layers_7_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_7_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(719960064)))]; tensor linear_46_cast_fp16 = linear(bias = encoder_layers_7_fc1_bias_to_fp16, weight = encoder_layers_7_fc1_weight_to_fp16, x = input0_47_cast_fp16)[name = tensor("linear_46_cast_fp16")]; tensor var_609_cast_fp16 = relu(x = linear_46_cast_fp16)[name = tensor("op_609_cast_fp16")]; tensor encoder_layers_7_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_7_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(719968320)))]; tensor encoder_layers_7_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_7_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(728356992)))]; tensor linear_47_cast_fp16 = linear(bias = encoder_layers_7_fc2_bias_to_fp16, weight = encoder_layers_7_fc2_weight_to_fp16, x = var_609_cast_fp16)[name = tensor("linear_47_cast_fp16")]; tensor var_615_cast_fp16 = add(x = input_49_cast_fp16, y = linear_47_cast_fp16)[name = tensor("op_615_cast_fp16")]; tensor hidden_states_35_axes_0 = const()[name = tensor("hidden_states_35_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(728359104)))]; tensor encoder_layers_8_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(728361216)))]; tensor hidden_states_35_cast_fp16 = layer_norm(axes = hidden_states_35_axes_0, beta = encoder_layers_8_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_8_self_attn_layer_norm_weight_to_fp16, x = var_615_cast_fp16)[name = tensor("hidden_states_35_cast_fp16")]; tensor encoder_layers_8_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(728363328)))]; tensor encoder_layers_8_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(730460544)))]; tensor linear_48_cast_fp16 = linear(bias = encoder_layers_8_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_8_self_attn_q_proj_weight_to_fp16, x = hidden_states_35_cast_fp16)[name = tensor("linear_48_cast_fp16")]; tensor var_634 = const()[name = tensor("op_634"), val = tensor([1, 256, -1, 64])]; tensor var_635_cast_fp16 = reshape(shape = var_634, x = linear_48_cast_fp16)[name = tensor("op_635_cast_fp16")]; tensor encoder_layers_8_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(730462656)))]; tensor encoder_layers_8_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(732559872)))]; tensor linear_49_cast_fp16 = linear(bias = encoder_layers_8_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_8_self_attn_k_proj_weight_to_fp16, x = hidden_states_35_cast_fp16)[name = tensor("linear_49_cast_fp16")]; tensor encoder_layers_8_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(732561984)))]; tensor encoder_layers_8_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(734659200)))]; tensor linear_50_cast_fp16 = linear(bias = encoder_layers_8_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_8_self_attn_v_proj_weight_to_fp16, x = hidden_states_35_cast_fp16)[name = tensor("linear_50_cast_fp16")]; tensor var_643 = const()[name = tensor("op_643"), val = tensor([1, 256, -1, 64])]; tensor var_644_cast_fp16 = reshape(shape = var_643, x = linear_49_cast_fp16)[name = tensor("op_644_cast_fp16")]; tensor var_646 = const()[name = tensor("op_646"), val = tensor([1, 256, -1, 64])]; tensor var_647_cast_fp16 = reshape(shape = var_646, x = linear_50_cast_fp16)[name = tensor("op_647_cast_fp16")]; tensor value_18_perm_0 = const()[name = tensor("value_18_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_650_transpose_x_0 = const()[name = tensor("op_650_transpose_x_0"), val = tensor(false)]; tensor var_650_transpose_y_0 = const()[name = tensor("op_650_transpose_y_0"), val = tensor(false)]; tensor transpose_52_perm_0 = const()[name = tensor("transpose_52_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_53_perm_0 = const()[name = tensor("transpose_53_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_53 = transpose(perm = transpose_53_perm_0, x = var_644_cast_fp16)[name = tensor("transpose_73")]; tensor transpose_52 = transpose(perm = transpose_52_perm_0, x = var_635_cast_fp16)[name = tensor("transpose_74")]; tensor var_650_cast_fp16 = matmul(transpose_x = var_650_transpose_x_0, transpose_y = var_650_transpose_y_0, x = transpose_52, y = transpose_53)[name = tensor("op_650_cast_fp16")]; tensor var_651_to_fp16 = const()[name = tensor("op_651_to_fp16"), val = tensor(0x1p-3)]; tensor attn_weights_18_cast_fp16 = mul(x = var_650_cast_fp16, y = var_651_to_fp16)[name = tensor("attn_weights_18_cast_fp16")]; tensor input_53_cast_fp16 = add(x = attn_weights_18_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor("input_53_cast_fp16")]; tensor input0_51_cast_fp16 = softmax(axis = var_18, x = input_53_cast_fp16)[name = tensor("input0_51_cast_fp16")]; tensor attn_output_18_transpose_x_0 = const()[name = tensor("attn_output_18_transpose_x_0"), val = tensor(false)]; tensor attn_output_18_transpose_y_0 = const()[name = tensor("attn_output_18_transpose_y_0"), val = tensor(false)]; tensor value_18_cast_fp16 = transpose(perm = value_18_perm_0, x = var_647_cast_fp16)[name = tensor("transpose_75")]; tensor attn_output_18_cast_fp16 = matmul(transpose_x = attn_output_18_transpose_x_0, transpose_y = attn_output_18_transpose_y_0, x = input0_51_cast_fp16, y = value_18_cast_fp16)[name = tensor("attn_output_18_cast_fp16")]; tensor var_657_perm_0 = const()[name = tensor("op_657_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_659 = const()[name = tensor("op_659"), val = tensor([1, 256, -1])]; tensor var_657_cast_fp16 = transpose(perm = var_657_perm_0, x = attn_output_18_cast_fp16)[name = tensor("transpose_72")]; tensor var_660_cast_fp16 = reshape(shape = var_659, x = var_657_cast_fp16)[name = tensor("op_660_cast_fp16")]; tensor encoder_layers_8_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(734661312)))]; tensor encoder_layers_8_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736758528)))]; tensor linear_51_cast_fp16 = linear(bias = encoder_layers_8_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_8_self_attn_out_proj_weight_to_fp16, x = var_660_cast_fp16)[name = tensor("linear_51_cast_fp16")]; tensor input_55_cast_fp16 = add(x = var_615_cast_fp16, y = linear_51_cast_fp16)[name = tensor("input_55_cast_fp16")]; tensor input0_53_axes_0 = const()[name = tensor("input0_53_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_8_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736760640)))]; tensor encoder_layers_8_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_8_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736762752)))]; tensor input0_53_cast_fp16 = layer_norm(axes = input0_53_axes_0, beta = encoder_layers_8_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_8_final_layer_norm_weight_to_fp16, x = input_55_cast_fp16)[name = tensor("input0_53_cast_fp16")]; tensor encoder_layers_8_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_8_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736764864)))]; tensor encoder_layers_8_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_8_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(745153536)))]; tensor linear_52_cast_fp16 = linear(bias = encoder_layers_8_fc1_bias_to_fp16, weight = encoder_layers_8_fc1_weight_to_fp16, x = input0_53_cast_fp16)[name = tensor("linear_52_cast_fp16")]; tensor var_674_cast_fp16 = relu(x = linear_52_cast_fp16)[name = tensor("op_674_cast_fp16")]; tensor encoder_layers_8_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_8_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(745161792)))]; tensor encoder_layers_8_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_8_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(753550464)))]; tensor linear_53_cast_fp16 = linear(bias = encoder_layers_8_fc2_bias_to_fp16, weight = encoder_layers_8_fc2_weight_to_fp16, x = var_674_cast_fp16)[name = tensor("linear_53_cast_fp16")]; tensor var_680_cast_fp16 = add(x = input_55_cast_fp16, y = linear_53_cast_fp16)[name = tensor("op_680_cast_fp16")]; tensor hidden_states_39_axes_0 = const()[name = tensor("hidden_states_39_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(753552576)))]; tensor encoder_layers_9_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(753554688)))]; tensor hidden_states_39_cast_fp16 = layer_norm(axes = hidden_states_39_axes_0, beta = encoder_layers_9_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_9_self_attn_layer_norm_weight_to_fp16, x = var_680_cast_fp16)[name = tensor("hidden_states_39_cast_fp16")]; tensor encoder_layers_9_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(753556800)))]; tensor encoder_layers_9_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(755654016)))]; tensor linear_54_cast_fp16 = linear(bias = encoder_layers_9_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_9_self_attn_q_proj_weight_to_fp16, x = hidden_states_39_cast_fp16)[name = tensor("linear_54_cast_fp16")]; tensor var_699 = const()[name = tensor("op_699"), val = tensor([1, 256, -1, 64])]; tensor var_700_cast_fp16 = reshape(shape = var_699, x = linear_54_cast_fp16)[name = tensor("op_700_cast_fp16")]; tensor encoder_layers_9_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(755656128)))]; tensor encoder_layers_9_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(757753344)))]; tensor linear_55_cast_fp16 = linear(bias = encoder_layers_9_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_9_self_attn_k_proj_weight_to_fp16, x = hidden_states_39_cast_fp16)[name = tensor("linear_55_cast_fp16")]; tensor encoder_layers_9_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(757755456)))]; tensor encoder_layers_9_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(759852672)))]; tensor linear_56_cast_fp16 = linear(bias = encoder_layers_9_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_9_self_attn_v_proj_weight_to_fp16, x = hidden_states_39_cast_fp16)[name = tensor("linear_56_cast_fp16")]; tensor var_708 = const()[name = tensor("op_708"), val = tensor([1, 256, -1, 64])]; tensor var_709_cast_fp16 = reshape(shape = var_708, x = linear_55_cast_fp16)[name = tensor("op_709_cast_fp16")]; tensor var_711 = const()[name = tensor("op_711"), val = tensor([1, 256, -1, 64])]; tensor var_712_cast_fp16 = reshape(shape = var_711, x = linear_56_cast_fp16)[name = tensor("op_712_cast_fp16")]; tensor value_20_perm_0 = const()[name = tensor("value_20_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_715_transpose_x_0 = const()[name = tensor("op_715_transpose_x_0"), val = tensor(false)]; tensor var_715_transpose_y_0 = const()[name = tensor("op_715_transpose_y_0"), val = tensor(false)]; tensor transpose_54_perm_0 = const()[name = tensor("transpose_54_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_55_perm_0 = const()[name = tensor("transpose_55_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_55 = transpose(perm = transpose_55_perm_0, x = var_709_cast_fp16)[name = tensor("transpose_69")]; tensor transpose_54 = transpose(perm = transpose_54_perm_0, x = var_700_cast_fp16)[name = tensor("transpose_70")]; tensor var_715_cast_fp16 = matmul(transpose_x = var_715_transpose_x_0, transpose_y = var_715_transpose_y_0, x = transpose_54, y = transpose_55)[name = tensor("op_715_cast_fp16")]; tensor var_716_to_fp16 = const()[name = tensor("op_716_to_fp16"), val = tensor(0x1p-3)]; tensor attn_weights_20_cast_fp16 = mul(x = var_715_cast_fp16, y = var_716_to_fp16)[name = tensor("attn_weights_20_cast_fp16")]; tensor input_59_cast_fp16 = add(x = attn_weights_20_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor("input_59_cast_fp16")]; tensor input0_57_cast_fp16 = softmax(axis = var_18, x = input_59_cast_fp16)[name = tensor("input0_57_cast_fp16")]; tensor attn_output_20_transpose_x_0 = const()[name = tensor("attn_output_20_transpose_x_0"), val = tensor(false)]; tensor attn_output_20_transpose_y_0 = const()[name = tensor("attn_output_20_transpose_y_0"), val = tensor(false)]; tensor value_20_cast_fp16 = transpose(perm = value_20_perm_0, x = var_712_cast_fp16)[name = tensor("transpose_71")]; tensor attn_output_20_cast_fp16 = matmul(transpose_x = attn_output_20_transpose_x_0, transpose_y = attn_output_20_transpose_y_0, x = input0_57_cast_fp16, y = value_20_cast_fp16)[name = tensor("attn_output_20_cast_fp16")]; tensor var_722_perm_0 = const()[name = tensor("op_722_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_724 = const()[name = tensor("op_724"), val = tensor([1, 256, -1])]; tensor var_722_cast_fp16 = transpose(perm = var_722_perm_0, x = attn_output_20_cast_fp16)[name = tensor("transpose_68")]; tensor var_725_cast_fp16 = reshape(shape = var_724, x = var_722_cast_fp16)[name = tensor("op_725_cast_fp16")]; tensor encoder_layers_9_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(759854784)))]; tensor encoder_layers_9_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(761952000)))]; tensor linear_57_cast_fp16 = linear(bias = encoder_layers_9_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_9_self_attn_out_proj_weight_to_fp16, x = var_725_cast_fp16)[name = tensor("linear_57_cast_fp16")]; tensor input_61_cast_fp16 = add(x = var_680_cast_fp16, y = linear_57_cast_fp16)[name = tensor("input_61_cast_fp16")]; tensor input0_59_axes_0 = const()[name = tensor("input0_59_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_9_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(761954112)))]; tensor encoder_layers_9_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_9_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(761956224)))]; tensor input0_59_cast_fp16 = layer_norm(axes = input0_59_axes_0, beta = encoder_layers_9_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_9_final_layer_norm_weight_to_fp16, x = input_61_cast_fp16)[name = tensor("input0_59_cast_fp16")]; tensor encoder_layers_9_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_9_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(761958336)))]; tensor encoder_layers_9_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_9_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(770347008)))]; tensor linear_58_cast_fp16 = linear(bias = encoder_layers_9_fc1_bias_to_fp16, weight = encoder_layers_9_fc1_weight_to_fp16, x = input0_59_cast_fp16)[name = tensor("linear_58_cast_fp16")]; tensor var_739_cast_fp16 = relu(x = linear_58_cast_fp16)[name = tensor("op_739_cast_fp16")]; tensor encoder_layers_9_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_9_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(770355264)))]; tensor encoder_layers_9_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_9_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(778743936)))]; tensor linear_59_cast_fp16 = linear(bias = encoder_layers_9_fc2_bias_to_fp16, weight = encoder_layers_9_fc2_weight_to_fp16, x = var_739_cast_fp16)[name = tensor("linear_59_cast_fp16")]; tensor var_745_cast_fp16 = add(x = input_61_cast_fp16, y = linear_59_cast_fp16)[name = tensor("op_745_cast_fp16")]; tensor hidden_states_43_axes_0 = const()[name = tensor("hidden_states_43_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(778746048)))]; tensor encoder_layers_10_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(778748160)))]; tensor hidden_states_43_cast_fp16 = layer_norm(axes = hidden_states_43_axes_0, beta = encoder_layers_10_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_10_self_attn_layer_norm_weight_to_fp16, x = var_745_cast_fp16)[name = tensor("hidden_states_43_cast_fp16")]; tensor encoder_layers_10_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(778750272)))]; tensor encoder_layers_10_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(780847488)))]; tensor linear_60_cast_fp16 = linear(bias = encoder_layers_10_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_10_self_attn_q_proj_weight_to_fp16, x = hidden_states_43_cast_fp16)[name = tensor("linear_60_cast_fp16")]; tensor var_764 = const()[name = tensor("op_764"), val = tensor([1, 256, -1, 64])]; tensor var_765_cast_fp16 = reshape(shape = var_764, x = linear_60_cast_fp16)[name = tensor("op_765_cast_fp16")]; tensor encoder_layers_10_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(780849600)))]; tensor encoder_layers_10_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(782946816)))]; tensor linear_61_cast_fp16 = linear(bias = encoder_layers_10_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_10_self_attn_k_proj_weight_to_fp16, x = hidden_states_43_cast_fp16)[name = tensor("linear_61_cast_fp16")]; tensor encoder_layers_10_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(782948928)))]; tensor encoder_layers_10_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(785046144)))]; tensor linear_62_cast_fp16 = linear(bias = encoder_layers_10_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_10_self_attn_v_proj_weight_to_fp16, x = hidden_states_43_cast_fp16)[name = tensor("linear_62_cast_fp16")]; tensor var_773 = const()[name = tensor("op_773"), val = tensor([1, 256, -1, 64])]; tensor var_774_cast_fp16 = reshape(shape = var_773, x = linear_61_cast_fp16)[name = tensor("op_774_cast_fp16")]; tensor var_776 = const()[name = tensor("op_776"), val = tensor([1, 256, -1, 64])]; tensor var_777_cast_fp16 = reshape(shape = var_776, x = linear_62_cast_fp16)[name = tensor("op_777_cast_fp16")]; tensor value_22_perm_0 = const()[name = tensor("value_22_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_780_transpose_x_0 = const()[name = tensor("op_780_transpose_x_0"), val = tensor(false)]; tensor var_780_transpose_y_0 = const()[name = tensor("op_780_transpose_y_0"), val = tensor(false)]; tensor transpose_56_perm_0 = const()[name = tensor("transpose_56_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_57_perm_0 = const()[name = tensor("transpose_57_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_57 = transpose(perm = transpose_57_perm_0, x = var_774_cast_fp16)[name = tensor("transpose_65")]; tensor transpose_56 = transpose(perm = transpose_56_perm_0, x = var_765_cast_fp16)[name = tensor("transpose_66")]; tensor var_780_cast_fp16 = matmul(transpose_x = var_780_transpose_x_0, transpose_y = var_780_transpose_y_0, x = transpose_56, y = transpose_57)[name = tensor("op_780_cast_fp16")]; tensor var_781_to_fp16 = const()[name = tensor("op_781_to_fp16"), val = tensor(0x1p-3)]; tensor attn_weights_22_cast_fp16 = mul(x = var_780_cast_fp16, y = var_781_to_fp16)[name = tensor("attn_weights_22_cast_fp16")]; tensor input_65_cast_fp16 = add(x = attn_weights_22_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor("input_65_cast_fp16")]; tensor input0_63_cast_fp16 = softmax(axis = var_18, x = input_65_cast_fp16)[name = tensor("input0_63_cast_fp16")]; tensor attn_output_22_transpose_x_0 = const()[name = tensor("attn_output_22_transpose_x_0"), val = tensor(false)]; tensor attn_output_22_transpose_y_0 = const()[name = tensor("attn_output_22_transpose_y_0"), val = tensor(false)]; tensor value_22_cast_fp16 = transpose(perm = value_22_perm_0, x = var_777_cast_fp16)[name = tensor("transpose_67")]; tensor attn_output_22_cast_fp16 = matmul(transpose_x = attn_output_22_transpose_x_0, transpose_y = attn_output_22_transpose_y_0, x = input0_63_cast_fp16, y = value_22_cast_fp16)[name = tensor("attn_output_22_cast_fp16")]; tensor var_787_perm_0 = const()[name = tensor("op_787_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_789 = const()[name = tensor("op_789"), val = tensor([1, 256, -1])]; tensor var_787_cast_fp16 = transpose(perm = var_787_perm_0, x = attn_output_22_cast_fp16)[name = tensor("transpose_64")]; tensor var_790_cast_fp16 = reshape(shape = var_789, x = var_787_cast_fp16)[name = tensor("op_790_cast_fp16")]; tensor encoder_layers_10_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(785048256)))]; tensor encoder_layers_10_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(787145472)))]; tensor linear_63_cast_fp16 = linear(bias = encoder_layers_10_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_10_self_attn_out_proj_weight_to_fp16, x = var_790_cast_fp16)[name = tensor("linear_63_cast_fp16")]; tensor input_67_cast_fp16 = add(x = var_745_cast_fp16, y = linear_63_cast_fp16)[name = tensor("input_67_cast_fp16")]; tensor input0_65_axes_0 = const()[name = tensor("input0_65_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_10_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(787147584)))]; tensor encoder_layers_10_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_10_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(787149696)))]; tensor input0_65_cast_fp16 = layer_norm(axes = input0_65_axes_0, beta = encoder_layers_10_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_10_final_layer_norm_weight_to_fp16, x = input_67_cast_fp16)[name = tensor("input0_65_cast_fp16")]; tensor encoder_layers_10_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_10_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(787151808)))]; tensor encoder_layers_10_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_10_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(795540480)))]; tensor linear_64_cast_fp16 = linear(bias = encoder_layers_10_fc1_bias_to_fp16, weight = encoder_layers_10_fc1_weight_to_fp16, x = input0_65_cast_fp16)[name = tensor("linear_64_cast_fp16")]; tensor var_804_cast_fp16 = relu(x = linear_64_cast_fp16)[name = tensor("op_804_cast_fp16")]; tensor encoder_layers_10_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_10_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(795548736)))]; tensor encoder_layers_10_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_10_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(803937408)))]; tensor linear_65_cast_fp16 = linear(bias = encoder_layers_10_fc2_bias_to_fp16, weight = encoder_layers_10_fc2_weight_to_fp16, x = var_804_cast_fp16)[name = tensor("linear_65_cast_fp16")]; tensor var_810_cast_fp16 = add(x = input_67_cast_fp16, y = linear_65_cast_fp16)[name = tensor("op_810_cast_fp16")]; tensor hidden_states_1_axes_0 = const()[name = tensor("hidden_states_1_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(803939520)))]; tensor encoder_layers_11_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(803941632)))]; tensor hidden_states_1_cast_fp16 = layer_norm(axes = hidden_states_1_axes_0, beta = encoder_layers_11_self_attn_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_11_self_attn_layer_norm_weight_to_fp16, x = var_810_cast_fp16)[name = tensor("hidden_states_1_cast_fp16")]; tensor encoder_layers_11_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(803943744)))]; tensor encoder_layers_11_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(806040960)))]; tensor linear_66_cast_fp16 = linear(bias = encoder_layers_11_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_11_self_attn_q_proj_weight_to_fp16, x = hidden_states_1_cast_fp16)[name = tensor("linear_66_cast_fp16")]; tensor var_829 = const()[name = tensor("op_829"), val = tensor([1, 256, -1, 64])]; tensor var_830_cast_fp16 = reshape(shape = var_829, x = linear_66_cast_fp16)[name = tensor("op_830_cast_fp16")]; tensor encoder_layers_11_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(806043072)))]; tensor encoder_layers_11_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(808140288)))]; tensor linear_67_cast_fp16 = linear(bias = encoder_layers_11_self_attn_k_proj_bias_to_fp16, weight = encoder_layers_11_self_attn_k_proj_weight_to_fp16, x = hidden_states_1_cast_fp16)[name = tensor("linear_67_cast_fp16")]; tensor encoder_layers_11_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(808142400)))]; tensor encoder_layers_11_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(810239616)))]; tensor linear_68_cast_fp16 = linear(bias = encoder_layers_11_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_11_self_attn_v_proj_weight_to_fp16, x = hidden_states_1_cast_fp16)[name = tensor("linear_68_cast_fp16")]; tensor var_838 = const()[name = tensor("op_838"), val = tensor([1, 256, -1, 64])]; tensor var_839_cast_fp16 = reshape(shape = var_838, x = linear_67_cast_fp16)[name = tensor("op_839_cast_fp16")]; tensor var_841 = const()[name = tensor("op_841"), val = tensor([1, 256, -1, 64])]; tensor var_842_cast_fp16 = reshape(shape = var_841, x = linear_68_cast_fp16)[name = tensor("op_842_cast_fp16")]; tensor value_1_perm_0 = const()[name = tensor("value_1_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_845_transpose_x_0 = const()[name = tensor("op_845_transpose_x_0"), val = tensor(false)]; tensor var_845_transpose_y_0 = const()[name = tensor("op_845_transpose_y_0"), val = tensor(false)]; tensor transpose_58_perm_0 = const()[name = tensor("transpose_58_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_59_perm_0 = const()[name = tensor("transpose_59_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_59 = transpose(perm = transpose_59_perm_0, x = var_839_cast_fp16)[name = tensor("transpose_61")]; tensor transpose_58 = transpose(perm = transpose_58_perm_0, x = var_830_cast_fp16)[name = tensor("transpose_62")]; tensor var_845_cast_fp16 = matmul(transpose_x = var_845_transpose_x_0, transpose_y = var_845_transpose_y_0, x = transpose_58, y = transpose_59)[name = tensor("op_845_cast_fp16")]; tensor var_846_to_fp16 = const()[name = tensor("op_846_to_fp16"), val = tensor(0x1p-3)]; tensor attn_weights_1_cast_fp16 = mul(x = var_845_cast_fp16, y = var_846_to_fp16)[name = tensor("attn_weights_1_cast_fp16")]; tensor input_4_cast_fp16 = add(x = attn_weights_1_cast_fp16, y = attention_mask0_1_cast_fp16)[name = tensor("input_4_cast_fp16")]; tensor input0_4_cast_fp16 = softmax(axis = var_18, x = input_4_cast_fp16)[name = tensor("input0_4_cast_fp16")]; tensor attn_output_1_transpose_x_0 = const()[name = tensor("attn_output_1_transpose_x_0"), val = tensor(false)]; tensor attn_output_1_transpose_y_0 = const()[name = tensor("attn_output_1_transpose_y_0"), val = tensor(false)]; tensor value_1_cast_fp16 = transpose(perm = value_1_perm_0, x = var_842_cast_fp16)[name = tensor("transpose_63")]; tensor attn_output_1_cast_fp16 = matmul(transpose_x = attn_output_1_transpose_x_0, transpose_y = attn_output_1_transpose_y_0, x = input0_4_cast_fp16, y = value_1_cast_fp16)[name = tensor("attn_output_1_cast_fp16")]; tensor var_852_perm_0 = const()[name = tensor("op_852_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_854 = const()[name = tensor("op_854"), val = tensor([1, 256, -1])]; tensor var_852_cast_fp16 = transpose(perm = var_852_perm_0, x = attn_output_1_cast_fp16)[name = tensor("transpose_60")]; tensor var_855_cast_fp16 = reshape(shape = var_854, x = var_852_cast_fp16)[name = tensor("op_855_cast_fp16")]; tensor encoder_layers_11_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(810241728)))]; tensor encoder_layers_11_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(812338944)))]; tensor linear_69_cast_fp16 = linear(bias = encoder_layers_11_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_11_self_attn_out_proj_weight_to_fp16, x = var_855_cast_fp16)[name = tensor("linear_69_cast_fp16")]; tensor input_2_cast_fp16 = add(x = var_810_cast_fp16, y = linear_69_cast_fp16)[name = tensor("input_2_cast_fp16")]; tensor input0_1_axes_0 = const()[name = tensor("input0_1_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_11_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(812341056)))]; tensor encoder_layers_11_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_11_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(812343168)))]; tensor input0_1_cast_fp16 = layer_norm(axes = input0_1_axes_0, beta = encoder_layers_11_final_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layers_11_final_layer_norm_weight_to_fp16, x = input_2_cast_fp16)[name = tensor("input0_1_cast_fp16")]; tensor encoder_layers_11_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_11_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(812345280)))]; tensor encoder_layers_11_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_11_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(820733952)))]; tensor linear_70_cast_fp16 = linear(bias = encoder_layers_11_fc1_bias_to_fp16, weight = encoder_layers_11_fc1_weight_to_fp16, x = input0_1_cast_fp16)[name = tensor("linear_70_cast_fp16")]; tensor var_869_cast_fp16 = relu(x = linear_70_cast_fp16)[name = tensor("op_869_cast_fp16")]; tensor encoder_layers_11_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_11_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(820742208)))]; tensor encoder_layers_11_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_11_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(829130880)))]; tensor linear_71_cast_fp16 = linear(bias = encoder_layers_11_fc2_bias_to_fp16, weight = encoder_layers_11_fc2_weight_to_fp16, x = var_869_cast_fp16)[name = tensor("linear_71_cast_fp16")]; tensor var_875_cast_fp16 = add(x = input_2_cast_fp16, y = linear_71_cast_fp16)[name = tensor("op_875_cast_fp16")]; tensor var_879_axes_0 = const()[name = tensor("op_879_axes_0"), val = tensor([-1])]; tensor encoder_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(829132992)))]; tensor encoder_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(829135104)))]; tensor var_879 = layer_norm(axes = var_879_axes_0, beta = encoder_layer_norm_bias_to_fp16, epsilon = var_6_to_fp16, gamma = encoder_layer_norm_weight_to_fp16, x = var_875_cast_fp16)[name = tensor("op_879_cast_fp16")]; } -> (var_879); }