program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3510.2.1"}, {"coremlc-version", "3500.32.1"}, {"coremltools-component-torch", "2.7.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "9.0"}})] { func main(tensor mel_spectrogram) { tensor var_95_pad_type_0 = const()[name = tensor("op_95_pad_type_0"), val = tensor("custom")]; tensor var_95_pad_0 = const()[name = tensor("op_95_pad_0"), val = tensor([1, 1])]; tensor var_95_strides_0 = const()[name = tensor("op_95_strides_0"), val = tensor([1])]; tensor var_95_dilations_0 = const()[name = tensor("op_95_dilations_0"), val = tensor([1])]; tensor var_95_groups_0 = const()[name = tensor("op_95_groups_0"), val = tensor(1)]; tensor mel_spectrogram_to_fp16_dtype_0 = const()[name = tensor("mel_spectrogram_to_fp16_dtype_0"), val = tensor("fp16")]; tensor encoder_conv1_weight_to_fp16 = const()[name = tensor("encoder_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor encoder_conv1_bias_to_fp16 = const()[name = tensor("encoder_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(983168)))]; tensor mel_spectrogram_to_fp16 = cast(dtype = mel_spectrogram_to_fp16_dtype_0, x = mel_spectrogram)[name = tensor("cast_132")]; tensor var_95_cast_fp16 = conv(bias = encoder_conv1_bias_to_fp16, dilations = var_95_dilations_0, groups = var_95_groups_0, pad = var_95_pad_0, pad_type = var_95_pad_type_0, strides = var_95_strides_0, weight = encoder_conv1_weight_to_fp16, x = mel_spectrogram_to_fp16)[name = tensor("op_95_cast_fp16")]; tensor input_1_mode_0 = const()[name = tensor("input_1_mode_0"), val = tensor("EXACT")]; tensor input_1_cast_fp16 = gelu(mode = input_1_mode_0, x = var_95_cast_fp16)[name = tensor("input_1_cast_fp16")]; tensor var_103_pad_type_0 = const()[name = tensor("op_103_pad_type_0"), val = tensor("custom")]; tensor var_103_pad_0 = const()[name = tensor("op_103_pad_0"), val = tensor([1, 1])]; tensor var_103_strides_0 = const()[name = tensor("op_103_strides_0"), val = tensor([2])]; tensor var_103_dilations_0 = const()[name = tensor("op_103_dilations_0"), val = tensor([1])]; tensor var_103_groups_0 = const()[name = tensor("op_103_groups_0"), val = tensor(1)]; tensor encoder_conv2_weight_to_fp16 = const()[name = tensor("encoder_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(985792)))]; tensor encoder_conv2_bias_to_fp16 = const()[name = tensor("encoder_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10816256)))]; tensor var_103_cast_fp16 = conv(bias = encoder_conv2_bias_to_fp16, dilations = var_103_dilations_0, groups = var_103_groups_0, pad = var_103_pad_0, pad_type = var_103_pad_type_0, strides = var_103_strides_0, weight = encoder_conv2_weight_to_fp16, x = input_1_cast_fp16)[name = tensor("op_103_cast_fp16")]; tensor hidden_states_1_mode_0 = const()[name = tensor("hidden_states_1_mode_0"), val = tensor("EXACT")]; tensor hidden_states_1_cast_fp16 = gelu(mode = hidden_states_1_mode_0, x = var_103_cast_fp16)[name = tensor("hidden_states_1_cast_fp16")]; tensor hidden_states_3_perm_0 = const()[name = tensor("hidden_states_3_perm_0"), val = tensor([0, 2, 1])]; tensor encoder_embed_positions_weight_to_fp16 = const()[name = tensor("encoder_embed_positions_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10818880)))]; tensor hidden_states_3_cast_fp16 = transpose(perm = hidden_states_3_perm_0, x = hidden_states_1_cast_fp16)[name = tensor("transpose_320")]; tensor input_5_cast_fp16 = add(x = hidden_states_3_cast_fp16, y = encoder_embed_positions_weight_to_fp16)[name = tensor("input_5_cast_fp16")]; tensor hidden_states_5_axes_0 = const()[name = tensor("hidden_states_5_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14658944)))]; tensor encoder_layers_0_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14661568)))]; tensor var_4_to_fp16 = const()[name = tensor("op_4_to_fp16"), val = tensor(0x1.5p-17)]; tensor hidden_states_5_cast_fp16 = layer_norm(axes = hidden_states_5_axes_0, beta = encoder_layers_0_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_0_self_attn_layer_norm_weight_to_fp16, x = input_5_cast_fp16)[name = tensor("hidden_states_5_cast_fp16")]; tensor encoder_layers_0_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14664192)))]; tensor encoder_layers_0_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17941056)))]; tensor linear_0_cast_fp16 = linear(bias = encoder_layers_0_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_0_self_attn_q_proj_weight_to_fp16, x = hidden_states_5_cast_fp16)[name = tensor("linear_0_cast_fp16")]; tensor encoder_layers_0_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17943680)))]; tensor linear_1_bias_0_to_fp16 = const()[name = tensor("linear_1_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21220544)))]; tensor linear_1_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_0_self_attn_k_proj_weight_to_fp16, x = hidden_states_5_cast_fp16)[name = tensor("linear_1_cast_fp16")]; tensor encoder_layers_0_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21223168)))]; tensor encoder_layers_0_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24500032)))]; tensor linear_2_cast_fp16 = linear(bias = encoder_layers_0_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_0_self_attn_v_proj_weight_to_fp16, x = hidden_states_5_cast_fp16)[name = tensor("linear_2_cast_fp16")]; tensor var_133 = const()[name = tensor("op_133"), val = tensor([1, 1500, 20, 64])]; tensor var_134_cast_fp16 = reshape(shape = var_133, x = linear_0_cast_fp16)[name = tensor("op_134_cast_fp16")]; tensor var_136 = const()[name = tensor("op_136"), val = tensor([1, 1500, 20, 64])]; tensor var_137_cast_fp16 = reshape(shape = var_136, x = linear_1_cast_fp16)[name = tensor("op_137_cast_fp16")]; tensor var_139 = const()[name = tensor("op_139"), val = tensor([1, 1500, 20, 64])]; tensor var_140_cast_fp16 = reshape(shape = var_139, x = linear_2_cast_fp16)[name = tensor("op_140_cast_fp16")]; tensor value_3_perm_0 = const()[name = tensor("value_3_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_6_to_fp16 = const()[name = tensor("op_6_to_fp16"), val = tensor(0x1p-3)]; tensor mul_0_cast_fp16 = mul(x = var_134_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_0_cast_fp16")]; tensor matmul_0_transpose_y_0 = const()[name = tensor("matmul_0_transpose_y_0"), val = tensor(true)]; tensor matmul_0_transpose_x_0 = const()[name = tensor("matmul_0_transpose_x_0"), val = tensor(false)]; tensor transpose_128_perm_0 = const()[name = tensor("transpose_128_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_129_perm_0 = const()[name = tensor("transpose_129_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_129 = transpose(perm = transpose_129_perm_0, x = var_137_cast_fp16)[name = tensor("transpose_317")]; tensor transpose_128 = transpose(perm = transpose_128_perm_0, x = mul_0_cast_fp16)[name = tensor("transpose_318")]; tensor matmul_0_cast_fp16 = matmul(transpose_x = matmul_0_transpose_x_0, transpose_y = matmul_0_transpose_y_0, x = transpose_128, y = transpose_129)[name = tensor("matmul_0_cast_fp16")]; tensor softmax_0_axis_0 = const()[name = tensor("softmax_0_axis_0"), val = tensor(-1)]; tensor softmax_0_cast_fp16 = softmax(axis = softmax_0_axis_0, x = matmul_0_cast_fp16)[name = tensor("softmax_0_cast_fp16")]; tensor attn_output_1_transpose_x_0 = const()[name = tensor("attn_output_1_transpose_x_0"), val = tensor(false)]; tensor attn_output_1_transpose_y_0 = const()[name = tensor("attn_output_1_transpose_y_0"), val = tensor(false)]; tensor value_3_cast_fp16 = transpose(perm = value_3_perm_0, x = var_140_cast_fp16)[name = tensor("transpose_319")]; tensor attn_output_1_cast_fp16 = matmul(transpose_x = attn_output_1_transpose_x_0, transpose_y = attn_output_1_transpose_y_0, x = softmax_0_cast_fp16, y = value_3_cast_fp16)[name = tensor("attn_output_1_cast_fp16")]; tensor var_143_perm_0 = const()[name = tensor("op_143_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_145 = const()[name = tensor("op_145"), val = tensor([1, 1500, 1280])]; tensor var_143_cast_fp16 = transpose(perm = var_143_perm_0, x = attn_output_1_cast_fp16)[name = tensor("transpose_316")]; tensor input_7_cast_fp16 = reshape(shape = var_145, x = var_143_cast_fp16)[name = tensor("input_7_cast_fp16")]; tensor encoder_layers_0_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24502656)))]; tensor encoder_layers_0_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27779520)))]; tensor linear_3_cast_fp16 = linear(bias = encoder_layers_0_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_0_self_attn_out_proj_weight_to_fp16, x = input_7_cast_fp16)[name = tensor("linear_3_cast_fp16")]; tensor input_9_cast_fp16 = add(x = input_5_cast_fp16, y = linear_3_cast_fp16)[name = tensor("input_9_cast_fp16")]; tensor input_11_axes_0 = const()[name = tensor("input_11_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_0_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27782144)))]; tensor encoder_layers_0_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_0_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27784768)))]; tensor input_11_cast_fp16 = layer_norm(axes = input_11_axes_0, beta = encoder_layers_0_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_0_final_layer_norm_weight_to_fp16, x = input_9_cast_fp16)[name = tensor("input_11_cast_fp16")]; tensor encoder_layers_0_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_0_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27787392)))]; tensor encoder_layers_0_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_0_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40894656)))]; tensor linear_4_cast_fp16 = linear(bias = encoder_layers_0_fc1_bias_to_fp16, weight = encoder_layers_0_fc1_weight_to_fp16, x = input_11_cast_fp16)[name = tensor("linear_4_cast_fp16")]; tensor input_13_mode_0 = const()[name = tensor("input_13_mode_0"), val = tensor("EXACT")]; tensor input_13_cast_fp16 = gelu(mode = input_13_mode_0, x = linear_4_cast_fp16)[name = tensor("input_13_cast_fp16")]; tensor encoder_layers_0_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_0_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40904960)))]; tensor encoder_layers_0_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_0_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(54012224)))]; tensor linear_5_cast_fp16 = linear(bias = encoder_layers_0_fc2_bias_to_fp16, weight = encoder_layers_0_fc2_weight_to_fp16, x = input_13_cast_fp16)[name = tensor("linear_5_cast_fp16")]; tensor input_15_cast_fp16 = add(x = input_9_cast_fp16, y = linear_5_cast_fp16)[name = tensor("input_15_cast_fp16")]; tensor hidden_states_11_axes_0 = const()[name = tensor("hidden_states_11_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(54014848)))]; tensor encoder_layers_1_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(54017472)))]; tensor hidden_states_11_cast_fp16 = layer_norm(axes = hidden_states_11_axes_0, beta = encoder_layers_1_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_1_self_attn_layer_norm_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("hidden_states_11_cast_fp16")]; tensor encoder_layers_1_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(54020096)))]; tensor encoder_layers_1_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57296960)))]; tensor linear_6_cast_fp16 = linear(bias = encoder_layers_1_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_1_self_attn_q_proj_weight_to_fp16, x = hidden_states_11_cast_fp16)[name = tensor("linear_6_cast_fp16")]; tensor encoder_layers_1_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57299584)))]; tensor linear_7_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_1_self_attn_k_proj_weight_to_fp16, x = hidden_states_11_cast_fp16)[name = tensor("linear_7_cast_fp16")]; tensor encoder_layers_1_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60576448)))]; tensor encoder_layers_1_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(63853312)))]; tensor linear_8_cast_fp16 = linear(bias = encoder_layers_1_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_1_self_attn_v_proj_weight_to_fp16, x = hidden_states_11_cast_fp16)[name = tensor("linear_8_cast_fp16")]; tensor var_186 = const()[name = tensor("op_186"), val = tensor([1, 1500, 20, 64])]; tensor var_187_cast_fp16 = reshape(shape = var_186, x = linear_6_cast_fp16)[name = tensor("op_187_cast_fp16")]; tensor var_189 = const()[name = tensor("op_189"), val = tensor([1, 1500, 20, 64])]; tensor var_190_cast_fp16 = reshape(shape = var_189, x = linear_7_cast_fp16)[name = tensor("op_190_cast_fp16")]; tensor var_192 = const()[name = tensor("op_192"), val = tensor([1, 1500, 20, 64])]; tensor var_193_cast_fp16 = reshape(shape = var_192, x = linear_8_cast_fp16)[name = tensor("op_193_cast_fp16")]; tensor value_7_perm_0 = const()[name = tensor("value_7_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_1_cast_fp16 = mul(x = var_187_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_1_cast_fp16")]; tensor matmul_1_transpose_y_0 = const()[name = tensor("matmul_1_transpose_y_0"), val = tensor(true)]; tensor matmul_1_transpose_x_0 = const()[name = tensor("matmul_1_transpose_x_0"), val = tensor(false)]; tensor transpose_130_perm_0 = const()[name = tensor("transpose_130_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_131_perm_0 = const()[name = tensor("transpose_131_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_131 = transpose(perm = transpose_131_perm_0, x = var_190_cast_fp16)[name = tensor("transpose_313")]; tensor transpose_130 = transpose(perm = transpose_130_perm_0, x = mul_1_cast_fp16)[name = tensor("transpose_314")]; tensor matmul_1_cast_fp16 = matmul(transpose_x = matmul_1_transpose_x_0, transpose_y = matmul_1_transpose_y_0, x = transpose_130, y = transpose_131)[name = tensor("matmul_1_cast_fp16")]; tensor softmax_1_axis_0 = const()[name = tensor("softmax_1_axis_0"), val = tensor(-1)]; tensor softmax_1_cast_fp16 = softmax(axis = softmax_1_axis_0, x = matmul_1_cast_fp16)[name = tensor("softmax_1_cast_fp16")]; tensor attn_output_3_transpose_x_0 = const()[name = tensor("attn_output_3_transpose_x_0"), val = tensor(false)]; tensor attn_output_3_transpose_y_0 = const()[name = tensor("attn_output_3_transpose_y_0"), val = tensor(false)]; tensor value_7_cast_fp16 = transpose(perm = value_7_perm_0, x = var_193_cast_fp16)[name = tensor("transpose_315")]; tensor attn_output_3_cast_fp16 = matmul(transpose_x = attn_output_3_transpose_x_0, transpose_y = attn_output_3_transpose_y_0, x = softmax_1_cast_fp16, y = value_7_cast_fp16)[name = tensor("attn_output_3_cast_fp16")]; tensor var_196_perm_0 = const()[name = tensor("op_196_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_198 = const()[name = tensor("op_198"), val = tensor([1, 1500, 1280])]; tensor var_196_cast_fp16 = transpose(perm = var_196_perm_0, x = attn_output_3_cast_fp16)[name = tensor("transpose_312")]; tensor input_17_cast_fp16 = reshape(shape = var_198, x = var_196_cast_fp16)[name = tensor("input_17_cast_fp16")]; tensor encoder_layers_1_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(63855936)))]; tensor encoder_layers_1_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67132800)))]; tensor linear_9_cast_fp16 = linear(bias = encoder_layers_1_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_1_self_attn_out_proj_weight_to_fp16, x = input_17_cast_fp16)[name = tensor("linear_9_cast_fp16")]; tensor input_19_cast_fp16 = add(x = input_15_cast_fp16, y = linear_9_cast_fp16)[name = tensor("input_19_cast_fp16")]; tensor input_21_axes_0 = const()[name = tensor("input_21_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_1_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67135424)))]; tensor encoder_layers_1_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_1_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67138048)))]; tensor input_21_cast_fp16 = layer_norm(axes = input_21_axes_0, beta = encoder_layers_1_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_1_final_layer_norm_weight_to_fp16, x = input_19_cast_fp16)[name = tensor("input_21_cast_fp16")]; tensor encoder_layers_1_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_1_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67140672)))]; tensor encoder_layers_1_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_1_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80247936)))]; tensor linear_10_cast_fp16 = linear(bias = encoder_layers_1_fc1_bias_to_fp16, weight = encoder_layers_1_fc1_weight_to_fp16, x = input_21_cast_fp16)[name = tensor("linear_10_cast_fp16")]; tensor input_23_mode_0 = const()[name = tensor("input_23_mode_0"), val = tensor("EXACT")]; tensor input_23_cast_fp16 = gelu(mode = input_23_mode_0, x = linear_10_cast_fp16)[name = tensor("input_23_cast_fp16")]; tensor encoder_layers_1_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_1_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80258240)))]; tensor encoder_layers_1_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_1_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93365504)))]; tensor linear_11_cast_fp16 = linear(bias = encoder_layers_1_fc2_bias_to_fp16, weight = encoder_layers_1_fc2_weight_to_fp16, x = input_23_cast_fp16)[name = tensor("linear_11_cast_fp16")]; tensor input_25_cast_fp16 = add(x = input_19_cast_fp16, y = linear_11_cast_fp16)[name = tensor("input_25_cast_fp16")]; tensor hidden_states_17_axes_0 = const()[name = tensor("hidden_states_17_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93368128)))]; tensor encoder_layers_2_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93370752)))]; tensor hidden_states_17_cast_fp16 = layer_norm(axes = hidden_states_17_axes_0, beta = encoder_layers_2_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_2_self_attn_layer_norm_weight_to_fp16, x = input_25_cast_fp16)[name = tensor("hidden_states_17_cast_fp16")]; tensor encoder_layers_2_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93373376)))]; tensor encoder_layers_2_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(96650240)))]; tensor linear_12_cast_fp16 = linear(bias = encoder_layers_2_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_2_self_attn_q_proj_weight_to_fp16, x = hidden_states_17_cast_fp16)[name = tensor("linear_12_cast_fp16")]; tensor encoder_layers_2_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(96652864)))]; tensor linear_13_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_2_self_attn_k_proj_weight_to_fp16, x = hidden_states_17_cast_fp16)[name = tensor("linear_13_cast_fp16")]; tensor encoder_layers_2_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(99929728)))]; tensor encoder_layers_2_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103206592)))]; tensor linear_14_cast_fp16 = linear(bias = encoder_layers_2_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_2_self_attn_v_proj_weight_to_fp16, x = hidden_states_17_cast_fp16)[name = tensor("linear_14_cast_fp16")]; tensor var_239 = const()[name = tensor("op_239"), val = tensor([1, 1500, 20, 64])]; tensor var_240_cast_fp16 = reshape(shape = var_239, x = linear_12_cast_fp16)[name = tensor("op_240_cast_fp16")]; tensor var_242 = const()[name = tensor("op_242"), val = tensor([1, 1500, 20, 64])]; tensor var_243_cast_fp16 = reshape(shape = var_242, x = linear_13_cast_fp16)[name = tensor("op_243_cast_fp16")]; tensor var_245 = const()[name = tensor("op_245"), val = tensor([1, 1500, 20, 64])]; tensor var_246_cast_fp16 = reshape(shape = var_245, x = linear_14_cast_fp16)[name = tensor("op_246_cast_fp16")]; tensor value_11_perm_0 = const()[name = tensor("value_11_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_2_cast_fp16 = mul(x = var_240_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_2_cast_fp16")]; tensor matmul_2_transpose_y_0 = const()[name = tensor("matmul_2_transpose_y_0"), val = tensor(true)]; tensor matmul_2_transpose_x_0 = const()[name = tensor("matmul_2_transpose_x_0"), val = tensor(false)]; tensor transpose_132_perm_0 = const()[name = tensor("transpose_132_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_133_perm_0 = const()[name = tensor("transpose_133_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_133 = transpose(perm = transpose_133_perm_0, x = var_243_cast_fp16)[name = tensor("transpose_309")]; tensor transpose_132 = transpose(perm = transpose_132_perm_0, x = mul_2_cast_fp16)[name = tensor("transpose_310")]; tensor matmul_2_cast_fp16 = matmul(transpose_x = matmul_2_transpose_x_0, transpose_y = matmul_2_transpose_y_0, x = transpose_132, y = transpose_133)[name = tensor("matmul_2_cast_fp16")]; tensor softmax_2_axis_0 = const()[name = tensor("softmax_2_axis_0"), val = tensor(-1)]; tensor softmax_2_cast_fp16 = softmax(axis = softmax_2_axis_0, x = matmul_2_cast_fp16)[name = tensor("softmax_2_cast_fp16")]; tensor attn_output_5_transpose_x_0 = const()[name = tensor("attn_output_5_transpose_x_0"), val = tensor(false)]; tensor attn_output_5_transpose_y_0 = const()[name = tensor("attn_output_5_transpose_y_0"), val = tensor(false)]; tensor value_11_cast_fp16 = transpose(perm = value_11_perm_0, x = var_246_cast_fp16)[name = tensor("transpose_311")]; tensor attn_output_5_cast_fp16 = matmul(transpose_x = attn_output_5_transpose_x_0, transpose_y = attn_output_5_transpose_y_0, x = softmax_2_cast_fp16, y = value_11_cast_fp16)[name = tensor("attn_output_5_cast_fp16")]; tensor var_249_perm_0 = const()[name = tensor("op_249_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_251 = const()[name = tensor("op_251"), val = tensor([1, 1500, 1280])]; tensor var_249_cast_fp16 = transpose(perm = var_249_perm_0, x = attn_output_5_cast_fp16)[name = tensor("transpose_308")]; tensor input_27_cast_fp16 = reshape(shape = var_251, x = var_249_cast_fp16)[name = tensor("input_27_cast_fp16")]; tensor encoder_layers_2_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103209216)))]; tensor encoder_layers_2_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106486080)))]; tensor linear_15_cast_fp16 = linear(bias = encoder_layers_2_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_2_self_attn_out_proj_weight_to_fp16, x = input_27_cast_fp16)[name = tensor("linear_15_cast_fp16")]; tensor input_29_cast_fp16 = add(x = input_25_cast_fp16, y = linear_15_cast_fp16)[name = tensor("input_29_cast_fp16")]; tensor input_31_axes_0 = const()[name = tensor("input_31_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_2_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106488704)))]; tensor encoder_layers_2_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_2_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106491328)))]; tensor input_31_cast_fp16 = layer_norm(axes = input_31_axes_0, beta = encoder_layers_2_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_2_final_layer_norm_weight_to_fp16, x = input_29_cast_fp16)[name = tensor("input_31_cast_fp16")]; tensor encoder_layers_2_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_2_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106493952)))]; tensor encoder_layers_2_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_2_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119601216)))]; tensor linear_16_cast_fp16 = linear(bias = encoder_layers_2_fc1_bias_to_fp16, weight = encoder_layers_2_fc1_weight_to_fp16, x = input_31_cast_fp16)[name = tensor("linear_16_cast_fp16")]; tensor input_33_mode_0 = const()[name = tensor("input_33_mode_0"), val = tensor("EXACT")]; tensor input_33_cast_fp16 = gelu(mode = input_33_mode_0, x = linear_16_cast_fp16)[name = tensor("input_33_cast_fp16")]; tensor encoder_layers_2_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_2_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119611520)))]; tensor encoder_layers_2_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_2_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132718784)))]; tensor linear_17_cast_fp16 = linear(bias = encoder_layers_2_fc2_bias_to_fp16, weight = encoder_layers_2_fc2_weight_to_fp16, x = input_33_cast_fp16)[name = tensor("linear_17_cast_fp16")]; tensor input_35_cast_fp16 = add(x = input_29_cast_fp16, y = linear_17_cast_fp16)[name = tensor("input_35_cast_fp16")]; tensor hidden_states_23_axes_0 = const()[name = tensor("hidden_states_23_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132721408)))]; tensor encoder_layers_3_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132724032)))]; tensor hidden_states_23_cast_fp16 = layer_norm(axes = hidden_states_23_axes_0, beta = encoder_layers_3_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_3_self_attn_layer_norm_weight_to_fp16, x = input_35_cast_fp16)[name = tensor("hidden_states_23_cast_fp16")]; tensor encoder_layers_3_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132726656)))]; tensor encoder_layers_3_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(136003520)))]; tensor linear_18_cast_fp16 = linear(bias = encoder_layers_3_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_3_self_attn_q_proj_weight_to_fp16, x = hidden_states_23_cast_fp16)[name = tensor("linear_18_cast_fp16")]; tensor encoder_layers_3_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(136006144)))]; tensor linear_19_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_3_self_attn_k_proj_weight_to_fp16, x = hidden_states_23_cast_fp16)[name = tensor("linear_19_cast_fp16")]; tensor encoder_layers_3_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139283008)))]; tensor encoder_layers_3_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(142559872)))]; tensor linear_20_cast_fp16 = linear(bias = encoder_layers_3_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_3_self_attn_v_proj_weight_to_fp16, x = hidden_states_23_cast_fp16)[name = tensor("linear_20_cast_fp16")]; tensor var_292 = const()[name = tensor("op_292"), val = tensor([1, 1500, 20, 64])]; tensor var_293_cast_fp16 = reshape(shape = var_292, x = linear_18_cast_fp16)[name = tensor("op_293_cast_fp16")]; tensor var_295 = const()[name = tensor("op_295"), val = tensor([1, 1500, 20, 64])]; tensor var_296_cast_fp16 = reshape(shape = var_295, x = linear_19_cast_fp16)[name = tensor("op_296_cast_fp16")]; tensor var_298 = const()[name = tensor("op_298"), val = tensor([1, 1500, 20, 64])]; tensor var_299_cast_fp16 = reshape(shape = var_298, x = linear_20_cast_fp16)[name = tensor("op_299_cast_fp16")]; tensor value_15_perm_0 = const()[name = tensor("value_15_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_3_cast_fp16 = mul(x = var_293_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_3_cast_fp16")]; tensor matmul_3_transpose_y_0 = const()[name = tensor("matmul_3_transpose_y_0"), val = tensor(true)]; tensor matmul_3_transpose_x_0 = const()[name = tensor("matmul_3_transpose_x_0"), val = tensor(false)]; tensor transpose_134_perm_0 = const()[name = tensor("transpose_134_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_135_perm_0 = const()[name = tensor("transpose_135_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_135 = transpose(perm = transpose_135_perm_0, x = var_296_cast_fp16)[name = tensor("transpose_305")]; tensor transpose_134 = transpose(perm = transpose_134_perm_0, x = mul_3_cast_fp16)[name = tensor("transpose_306")]; tensor matmul_3_cast_fp16 = matmul(transpose_x = matmul_3_transpose_x_0, transpose_y = matmul_3_transpose_y_0, x = transpose_134, y = transpose_135)[name = tensor("matmul_3_cast_fp16")]; tensor softmax_3_axis_0 = const()[name = tensor("softmax_3_axis_0"), val = tensor(-1)]; tensor softmax_3_cast_fp16 = softmax(axis = softmax_3_axis_0, x = matmul_3_cast_fp16)[name = tensor("softmax_3_cast_fp16")]; tensor attn_output_7_transpose_x_0 = const()[name = tensor("attn_output_7_transpose_x_0"), val = tensor(false)]; tensor attn_output_7_transpose_y_0 = const()[name = tensor("attn_output_7_transpose_y_0"), val = tensor(false)]; tensor value_15_cast_fp16 = transpose(perm = value_15_perm_0, x = var_299_cast_fp16)[name = tensor("transpose_307")]; tensor attn_output_7_cast_fp16 = matmul(transpose_x = attn_output_7_transpose_x_0, transpose_y = attn_output_7_transpose_y_0, x = softmax_3_cast_fp16, y = value_15_cast_fp16)[name = tensor("attn_output_7_cast_fp16")]; tensor var_302_perm_0 = const()[name = tensor("op_302_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_304 = const()[name = tensor("op_304"), val = tensor([1, 1500, 1280])]; tensor var_302_cast_fp16 = transpose(perm = var_302_perm_0, x = attn_output_7_cast_fp16)[name = tensor("transpose_304")]; tensor input_37_cast_fp16 = reshape(shape = var_304, x = var_302_cast_fp16)[name = tensor("input_37_cast_fp16")]; tensor encoder_layers_3_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(142562496)))]; tensor encoder_layers_3_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145839360)))]; tensor linear_21_cast_fp16 = linear(bias = encoder_layers_3_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_3_self_attn_out_proj_weight_to_fp16, x = input_37_cast_fp16)[name = tensor("linear_21_cast_fp16")]; tensor input_39_cast_fp16 = add(x = input_35_cast_fp16, y = linear_21_cast_fp16)[name = tensor("input_39_cast_fp16")]; tensor input_41_axes_0 = const()[name = tensor("input_41_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_3_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145841984)))]; tensor encoder_layers_3_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_3_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145844608)))]; tensor input_41_cast_fp16 = layer_norm(axes = input_41_axes_0, beta = encoder_layers_3_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_3_final_layer_norm_weight_to_fp16, x = input_39_cast_fp16)[name = tensor("input_41_cast_fp16")]; tensor encoder_layers_3_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_3_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145847232)))]; tensor encoder_layers_3_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_3_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(158954496)))]; tensor linear_22_cast_fp16 = linear(bias = encoder_layers_3_fc1_bias_to_fp16, weight = encoder_layers_3_fc1_weight_to_fp16, x = input_41_cast_fp16)[name = tensor("linear_22_cast_fp16")]; tensor input_43_mode_0 = const()[name = tensor("input_43_mode_0"), val = tensor("EXACT")]; tensor input_43_cast_fp16 = gelu(mode = input_43_mode_0, x = linear_22_cast_fp16)[name = tensor("input_43_cast_fp16")]; tensor encoder_layers_3_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_3_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(158964800)))]; tensor encoder_layers_3_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_3_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172072064)))]; tensor linear_23_cast_fp16 = linear(bias = encoder_layers_3_fc2_bias_to_fp16, weight = encoder_layers_3_fc2_weight_to_fp16, x = input_43_cast_fp16)[name = tensor("linear_23_cast_fp16")]; tensor input_45_cast_fp16 = add(x = input_39_cast_fp16, y = linear_23_cast_fp16)[name = tensor("input_45_cast_fp16")]; tensor hidden_states_29_axes_0 = const()[name = tensor("hidden_states_29_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172074688)))]; tensor encoder_layers_4_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172077312)))]; tensor hidden_states_29_cast_fp16 = layer_norm(axes = hidden_states_29_axes_0, beta = encoder_layers_4_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_4_self_attn_layer_norm_weight_to_fp16, x = input_45_cast_fp16)[name = tensor("hidden_states_29_cast_fp16")]; tensor encoder_layers_4_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172079936)))]; tensor encoder_layers_4_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(175356800)))]; tensor linear_24_cast_fp16 = linear(bias = encoder_layers_4_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_4_self_attn_q_proj_weight_to_fp16, x = hidden_states_29_cast_fp16)[name = tensor("linear_24_cast_fp16")]; tensor encoder_layers_4_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(175359424)))]; tensor linear_25_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_4_self_attn_k_proj_weight_to_fp16, x = hidden_states_29_cast_fp16)[name = tensor("linear_25_cast_fp16")]; tensor encoder_layers_4_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178636288)))]; tensor encoder_layers_4_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181913152)))]; tensor linear_26_cast_fp16 = linear(bias = encoder_layers_4_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_4_self_attn_v_proj_weight_to_fp16, x = hidden_states_29_cast_fp16)[name = tensor("linear_26_cast_fp16")]; tensor var_345 = const()[name = tensor("op_345"), val = tensor([1, 1500, 20, 64])]; tensor var_346_cast_fp16 = reshape(shape = var_345, x = linear_24_cast_fp16)[name = tensor("op_346_cast_fp16")]; tensor var_348 = const()[name = tensor("op_348"), val = tensor([1, 1500, 20, 64])]; tensor var_349_cast_fp16 = reshape(shape = var_348, x = linear_25_cast_fp16)[name = tensor("op_349_cast_fp16")]; tensor var_351 = const()[name = tensor("op_351"), val = tensor([1, 1500, 20, 64])]; tensor var_352_cast_fp16 = reshape(shape = var_351, x = linear_26_cast_fp16)[name = tensor("op_352_cast_fp16")]; tensor value_19_perm_0 = const()[name = tensor("value_19_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_4_cast_fp16 = mul(x = var_346_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_4_cast_fp16")]; tensor matmul_4_transpose_y_0 = const()[name = tensor("matmul_4_transpose_y_0"), val = tensor(true)]; tensor matmul_4_transpose_x_0 = const()[name = tensor("matmul_4_transpose_x_0"), val = tensor(false)]; tensor transpose_136_perm_0 = const()[name = tensor("transpose_136_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_137_perm_0 = const()[name = tensor("transpose_137_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_137 = transpose(perm = transpose_137_perm_0, x = var_349_cast_fp16)[name = tensor("transpose_301")]; tensor transpose_136 = transpose(perm = transpose_136_perm_0, x = mul_4_cast_fp16)[name = tensor("transpose_302")]; tensor matmul_4_cast_fp16 = matmul(transpose_x = matmul_4_transpose_x_0, transpose_y = matmul_4_transpose_y_0, x = transpose_136, y = transpose_137)[name = tensor("matmul_4_cast_fp16")]; tensor softmax_4_axis_0 = const()[name = tensor("softmax_4_axis_0"), val = tensor(-1)]; tensor softmax_4_cast_fp16 = softmax(axis = softmax_4_axis_0, x = matmul_4_cast_fp16)[name = tensor("softmax_4_cast_fp16")]; tensor attn_output_9_transpose_x_0 = const()[name = tensor("attn_output_9_transpose_x_0"), val = tensor(false)]; tensor attn_output_9_transpose_y_0 = const()[name = tensor("attn_output_9_transpose_y_0"), val = tensor(false)]; tensor value_19_cast_fp16 = transpose(perm = value_19_perm_0, x = var_352_cast_fp16)[name = tensor("transpose_303")]; tensor attn_output_9_cast_fp16 = matmul(transpose_x = attn_output_9_transpose_x_0, transpose_y = attn_output_9_transpose_y_0, x = softmax_4_cast_fp16, y = value_19_cast_fp16)[name = tensor("attn_output_9_cast_fp16")]; tensor var_355_perm_0 = const()[name = tensor("op_355_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_357 = const()[name = tensor("op_357"), val = tensor([1, 1500, 1280])]; tensor var_355_cast_fp16 = transpose(perm = var_355_perm_0, x = attn_output_9_cast_fp16)[name = tensor("transpose_300")]; tensor input_47_cast_fp16 = reshape(shape = var_357, x = var_355_cast_fp16)[name = tensor("input_47_cast_fp16")]; tensor encoder_layers_4_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181915776)))]; tensor encoder_layers_4_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185192640)))]; tensor linear_27_cast_fp16 = linear(bias = encoder_layers_4_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_4_self_attn_out_proj_weight_to_fp16, x = input_47_cast_fp16)[name = tensor("linear_27_cast_fp16")]; tensor input_49_cast_fp16 = add(x = input_45_cast_fp16, y = linear_27_cast_fp16)[name = tensor("input_49_cast_fp16")]; tensor input_51_axes_0 = const()[name = tensor("input_51_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_4_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185195264)))]; tensor encoder_layers_4_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_4_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185197888)))]; tensor input_51_cast_fp16 = layer_norm(axes = input_51_axes_0, beta = encoder_layers_4_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_4_final_layer_norm_weight_to_fp16, x = input_49_cast_fp16)[name = tensor("input_51_cast_fp16")]; tensor encoder_layers_4_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_4_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185200512)))]; tensor encoder_layers_4_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_4_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198307776)))]; tensor linear_28_cast_fp16 = linear(bias = encoder_layers_4_fc1_bias_to_fp16, weight = encoder_layers_4_fc1_weight_to_fp16, x = input_51_cast_fp16)[name = tensor("linear_28_cast_fp16")]; tensor input_53_mode_0 = const()[name = tensor("input_53_mode_0"), val = tensor("EXACT")]; tensor input_53_cast_fp16 = gelu(mode = input_53_mode_0, x = linear_28_cast_fp16)[name = tensor("input_53_cast_fp16")]; tensor encoder_layers_4_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_4_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198318080)))]; tensor encoder_layers_4_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_4_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211425344)))]; tensor linear_29_cast_fp16 = linear(bias = encoder_layers_4_fc2_bias_to_fp16, weight = encoder_layers_4_fc2_weight_to_fp16, x = input_53_cast_fp16)[name = tensor("linear_29_cast_fp16")]; tensor input_55_cast_fp16 = add(x = input_49_cast_fp16, y = linear_29_cast_fp16)[name = tensor("input_55_cast_fp16")]; tensor hidden_states_35_axes_0 = const()[name = tensor("hidden_states_35_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211427968)))]; tensor encoder_layers_5_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211430592)))]; tensor hidden_states_35_cast_fp16 = layer_norm(axes = hidden_states_35_axes_0, beta = encoder_layers_5_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_5_self_attn_layer_norm_weight_to_fp16, x = input_55_cast_fp16)[name = tensor("hidden_states_35_cast_fp16")]; tensor encoder_layers_5_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211433216)))]; tensor encoder_layers_5_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214710080)))]; tensor linear_30_cast_fp16 = linear(bias = encoder_layers_5_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_5_self_attn_q_proj_weight_to_fp16, x = hidden_states_35_cast_fp16)[name = tensor("linear_30_cast_fp16")]; tensor encoder_layers_5_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214712704)))]; tensor linear_31_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_5_self_attn_k_proj_weight_to_fp16, x = hidden_states_35_cast_fp16)[name = tensor("linear_31_cast_fp16")]; tensor encoder_layers_5_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217989568)))]; tensor encoder_layers_5_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(221266432)))]; tensor linear_32_cast_fp16 = linear(bias = encoder_layers_5_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_5_self_attn_v_proj_weight_to_fp16, x = hidden_states_35_cast_fp16)[name = tensor("linear_32_cast_fp16")]; tensor var_398 = const()[name = tensor("op_398"), val = tensor([1, 1500, 20, 64])]; tensor var_399_cast_fp16 = reshape(shape = var_398, x = linear_30_cast_fp16)[name = tensor("op_399_cast_fp16")]; tensor var_401 = const()[name = tensor("op_401"), val = tensor([1, 1500, 20, 64])]; tensor var_402_cast_fp16 = reshape(shape = var_401, x = linear_31_cast_fp16)[name = tensor("op_402_cast_fp16")]; tensor var_404 = const()[name = tensor("op_404"), val = tensor([1, 1500, 20, 64])]; tensor var_405_cast_fp16 = reshape(shape = var_404, x = linear_32_cast_fp16)[name = tensor("op_405_cast_fp16")]; tensor value_23_perm_0 = const()[name = tensor("value_23_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_5_cast_fp16 = mul(x = var_399_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_5_cast_fp16")]; tensor matmul_5_transpose_y_0 = const()[name = tensor("matmul_5_transpose_y_0"), val = tensor(true)]; tensor matmul_5_transpose_x_0 = const()[name = tensor("matmul_5_transpose_x_0"), val = tensor(false)]; tensor transpose_138_perm_0 = const()[name = tensor("transpose_138_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_139_perm_0 = const()[name = tensor("transpose_139_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_139 = transpose(perm = transpose_139_perm_0, x = var_402_cast_fp16)[name = tensor("transpose_297")]; tensor transpose_138 = transpose(perm = transpose_138_perm_0, x = mul_5_cast_fp16)[name = tensor("transpose_298")]; tensor matmul_5_cast_fp16 = matmul(transpose_x = matmul_5_transpose_x_0, transpose_y = matmul_5_transpose_y_0, x = transpose_138, y = transpose_139)[name = tensor("matmul_5_cast_fp16")]; tensor softmax_5_axis_0 = const()[name = tensor("softmax_5_axis_0"), val = tensor(-1)]; tensor softmax_5_cast_fp16 = softmax(axis = softmax_5_axis_0, x = matmul_5_cast_fp16)[name = tensor("softmax_5_cast_fp16")]; tensor attn_output_11_transpose_x_0 = const()[name = tensor("attn_output_11_transpose_x_0"), val = tensor(false)]; tensor attn_output_11_transpose_y_0 = const()[name = tensor("attn_output_11_transpose_y_0"), val = tensor(false)]; tensor value_23_cast_fp16 = transpose(perm = value_23_perm_0, x = var_405_cast_fp16)[name = tensor("transpose_299")]; tensor attn_output_11_cast_fp16 = matmul(transpose_x = attn_output_11_transpose_x_0, transpose_y = attn_output_11_transpose_y_0, x = softmax_5_cast_fp16, y = value_23_cast_fp16)[name = tensor("attn_output_11_cast_fp16")]; tensor var_408_perm_0 = const()[name = tensor("op_408_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_410 = const()[name = tensor("op_410"), val = tensor([1, 1500, 1280])]; tensor var_408_cast_fp16 = transpose(perm = var_408_perm_0, x = attn_output_11_cast_fp16)[name = tensor("transpose_296")]; tensor input_57_cast_fp16 = reshape(shape = var_410, x = var_408_cast_fp16)[name = tensor("input_57_cast_fp16")]; tensor encoder_layers_5_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(221269056)))]; tensor encoder_layers_5_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(224545920)))]; tensor linear_33_cast_fp16 = linear(bias = encoder_layers_5_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_5_self_attn_out_proj_weight_to_fp16, x = input_57_cast_fp16)[name = tensor("linear_33_cast_fp16")]; tensor input_59_cast_fp16 = add(x = input_55_cast_fp16, y = linear_33_cast_fp16)[name = tensor("input_59_cast_fp16")]; tensor input_61_axes_0 = const()[name = tensor("input_61_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_5_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(224548544)))]; tensor encoder_layers_5_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_5_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(224551168)))]; tensor input_61_cast_fp16 = layer_norm(axes = input_61_axes_0, beta = encoder_layers_5_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_5_final_layer_norm_weight_to_fp16, x = input_59_cast_fp16)[name = tensor("input_61_cast_fp16")]; tensor encoder_layers_5_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_5_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(224553792)))]; tensor encoder_layers_5_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_5_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237661056)))]; tensor linear_34_cast_fp16 = linear(bias = encoder_layers_5_fc1_bias_to_fp16, weight = encoder_layers_5_fc1_weight_to_fp16, x = input_61_cast_fp16)[name = tensor("linear_34_cast_fp16")]; tensor input_63_mode_0 = const()[name = tensor("input_63_mode_0"), val = tensor("EXACT")]; tensor input_63_cast_fp16 = gelu(mode = input_63_mode_0, x = linear_34_cast_fp16)[name = tensor("input_63_cast_fp16")]; tensor encoder_layers_5_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_5_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237671360)))]; tensor encoder_layers_5_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_5_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250778624)))]; tensor linear_35_cast_fp16 = linear(bias = encoder_layers_5_fc2_bias_to_fp16, weight = encoder_layers_5_fc2_weight_to_fp16, x = input_63_cast_fp16)[name = tensor("linear_35_cast_fp16")]; tensor input_65_cast_fp16 = add(x = input_59_cast_fp16, y = linear_35_cast_fp16)[name = tensor("input_65_cast_fp16")]; tensor hidden_states_41_axes_0 = const()[name = tensor("hidden_states_41_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250781248)))]; tensor encoder_layers_6_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250783872)))]; tensor hidden_states_41_cast_fp16 = layer_norm(axes = hidden_states_41_axes_0, beta = encoder_layers_6_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_6_self_attn_layer_norm_weight_to_fp16, x = input_65_cast_fp16)[name = tensor("hidden_states_41_cast_fp16")]; tensor encoder_layers_6_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250786496)))]; tensor encoder_layers_6_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(254063360)))]; tensor linear_36_cast_fp16 = linear(bias = encoder_layers_6_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_6_self_attn_q_proj_weight_to_fp16, x = hidden_states_41_cast_fp16)[name = tensor("linear_36_cast_fp16")]; tensor encoder_layers_6_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(254065984)))]; tensor linear_37_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_6_self_attn_k_proj_weight_to_fp16, x = hidden_states_41_cast_fp16)[name = tensor("linear_37_cast_fp16")]; tensor encoder_layers_6_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(257342848)))]; tensor encoder_layers_6_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(260619712)))]; tensor linear_38_cast_fp16 = linear(bias = encoder_layers_6_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_6_self_attn_v_proj_weight_to_fp16, x = hidden_states_41_cast_fp16)[name = tensor("linear_38_cast_fp16")]; tensor var_451 = const()[name = tensor("op_451"), val = tensor([1, 1500, 20, 64])]; tensor var_452_cast_fp16 = reshape(shape = var_451, x = linear_36_cast_fp16)[name = tensor("op_452_cast_fp16")]; tensor var_454 = const()[name = tensor("op_454"), val = tensor([1, 1500, 20, 64])]; tensor var_455_cast_fp16 = reshape(shape = var_454, x = linear_37_cast_fp16)[name = tensor("op_455_cast_fp16")]; tensor var_457 = const()[name = tensor("op_457"), val = tensor([1, 1500, 20, 64])]; tensor var_458_cast_fp16 = reshape(shape = var_457, x = linear_38_cast_fp16)[name = tensor("op_458_cast_fp16")]; tensor value_27_perm_0 = const()[name = tensor("value_27_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_6_cast_fp16 = mul(x = var_452_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_6_cast_fp16")]; tensor matmul_6_transpose_y_0 = const()[name = tensor("matmul_6_transpose_y_0"), val = tensor(true)]; tensor matmul_6_transpose_x_0 = const()[name = tensor("matmul_6_transpose_x_0"), val = tensor(false)]; tensor transpose_140_perm_0 = const()[name = tensor("transpose_140_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_141_perm_0 = const()[name = tensor("transpose_141_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_141 = transpose(perm = transpose_141_perm_0, x = var_455_cast_fp16)[name = tensor("transpose_293")]; tensor transpose_140 = transpose(perm = transpose_140_perm_0, x = mul_6_cast_fp16)[name = tensor("transpose_294")]; tensor matmul_6_cast_fp16 = matmul(transpose_x = matmul_6_transpose_x_0, transpose_y = matmul_6_transpose_y_0, x = transpose_140, y = transpose_141)[name = tensor("matmul_6_cast_fp16")]; tensor softmax_6_axis_0 = const()[name = tensor("softmax_6_axis_0"), val = tensor(-1)]; tensor softmax_6_cast_fp16 = softmax(axis = softmax_6_axis_0, x = matmul_6_cast_fp16)[name = tensor("softmax_6_cast_fp16")]; tensor attn_output_13_transpose_x_0 = const()[name = tensor("attn_output_13_transpose_x_0"), val = tensor(false)]; tensor attn_output_13_transpose_y_0 = const()[name = tensor("attn_output_13_transpose_y_0"), val = tensor(false)]; tensor value_27_cast_fp16 = transpose(perm = value_27_perm_0, x = var_458_cast_fp16)[name = tensor("transpose_295")]; tensor attn_output_13_cast_fp16 = matmul(transpose_x = attn_output_13_transpose_x_0, transpose_y = attn_output_13_transpose_y_0, x = softmax_6_cast_fp16, y = value_27_cast_fp16)[name = tensor("attn_output_13_cast_fp16")]; tensor var_461_perm_0 = const()[name = tensor("op_461_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_463 = const()[name = tensor("op_463"), val = tensor([1, 1500, 1280])]; tensor var_461_cast_fp16 = transpose(perm = var_461_perm_0, x = attn_output_13_cast_fp16)[name = tensor("transpose_292")]; tensor input_67_cast_fp16 = reshape(shape = var_463, x = var_461_cast_fp16)[name = tensor("input_67_cast_fp16")]; tensor encoder_layers_6_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(260622336)))]; tensor encoder_layers_6_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(263899200)))]; tensor linear_39_cast_fp16 = linear(bias = encoder_layers_6_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_6_self_attn_out_proj_weight_to_fp16, x = input_67_cast_fp16)[name = tensor("linear_39_cast_fp16")]; tensor input_69_cast_fp16 = add(x = input_65_cast_fp16, y = linear_39_cast_fp16)[name = tensor("input_69_cast_fp16")]; tensor input_71_axes_0 = const()[name = tensor("input_71_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_6_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(263901824)))]; tensor encoder_layers_6_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_6_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(263904448)))]; tensor input_71_cast_fp16 = layer_norm(axes = input_71_axes_0, beta = encoder_layers_6_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_6_final_layer_norm_weight_to_fp16, x = input_69_cast_fp16)[name = tensor("input_71_cast_fp16")]; tensor encoder_layers_6_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_6_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(263907072)))]; tensor encoder_layers_6_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_6_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(277014336)))]; tensor linear_40_cast_fp16 = linear(bias = encoder_layers_6_fc1_bias_to_fp16, weight = encoder_layers_6_fc1_weight_to_fp16, x = input_71_cast_fp16)[name = tensor("linear_40_cast_fp16")]; tensor input_73_mode_0 = const()[name = tensor("input_73_mode_0"), val = tensor("EXACT")]; tensor input_73_cast_fp16 = gelu(mode = input_73_mode_0, x = linear_40_cast_fp16)[name = tensor("input_73_cast_fp16")]; tensor encoder_layers_6_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_6_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(277024640)))]; tensor encoder_layers_6_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_6_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(290131904)))]; tensor linear_41_cast_fp16 = linear(bias = encoder_layers_6_fc2_bias_to_fp16, weight = encoder_layers_6_fc2_weight_to_fp16, x = input_73_cast_fp16)[name = tensor("linear_41_cast_fp16")]; tensor input_75_cast_fp16 = add(x = input_69_cast_fp16, y = linear_41_cast_fp16)[name = tensor("input_75_cast_fp16")]; tensor hidden_states_47_axes_0 = const()[name = tensor("hidden_states_47_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(290134528)))]; tensor encoder_layers_7_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(290137152)))]; tensor hidden_states_47_cast_fp16 = layer_norm(axes = hidden_states_47_axes_0, beta = encoder_layers_7_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_7_self_attn_layer_norm_weight_to_fp16, x = input_75_cast_fp16)[name = tensor("hidden_states_47_cast_fp16")]; tensor encoder_layers_7_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(290139776)))]; tensor encoder_layers_7_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293416640)))]; tensor linear_42_cast_fp16 = linear(bias = encoder_layers_7_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_7_self_attn_q_proj_weight_to_fp16, x = hidden_states_47_cast_fp16)[name = tensor("linear_42_cast_fp16")]; tensor encoder_layers_7_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293419264)))]; tensor linear_43_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_7_self_attn_k_proj_weight_to_fp16, x = hidden_states_47_cast_fp16)[name = tensor("linear_43_cast_fp16")]; tensor encoder_layers_7_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(296696128)))]; tensor encoder_layers_7_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299972992)))]; tensor linear_44_cast_fp16 = linear(bias = encoder_layers_7_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_7_self_attn_v_proj_weight_to_fp16, x = hidden_states_47_cast_fp16)[name = tensor("linear_44_cast_fp16")]; tensor var_504 = const()[name = tensor("op_504"), val = tensor([1, 1500, 20, 64])]; tensor var_505_cast_fp16 = reshape(shape = var_504, x = linear_42_cast_fp16)[name = tensor("op_505_cast_fp16")]; tensor var_507 = const()[name = tensor("op_507"), val = tensor([1, 1500, 20, 64])]; tensor var_508_cast_fp16 = reshape(shape = var_507, x = linear_43_cast_fp16)[name = tensor("op_508_cast_fp16")]; tensor var_510 = const()[name = tensor("op_510"), val = tensor([1, 1500, 20, 64])]; tensor var_511_cast_fp16 = reshape(shape = var_510, x = linear_44_cast_fp16)[name = tensor("op_511_cast_fp16")]; tensor value_31_perm_0 = const()[name = tensor("value_31_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_7_cast_fp16 = mul(x = var_505_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_7_cast_fp16")]; tensor matmul_7_transpose_y_0 = const()[name = tensor("matmul_7_transpose_y_0"), val = tensor(true)]; tensor matmul_7_transpose_x_0 = const()[name = tensor("matmul_7_transpose_x_0"), val = tensor(false)]; tensor transpose_142_perm_0 = const()[name = tensor("transpose_142_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_143_perm_0 = const()[name = tensor("transpose_143_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_143 = transpose(perm = transpose_143_perm_0, x = var_508_cast_fp16)[name = tensor("transpose_289")]; tensor transpose_142 = transpose(perm = transpose_142_perm_0, x = mul_7_cast_fp16)[name = tensor("transpose_290")]; tensor matmul_7_cast_fp16 = matmul(transpose_x = matmul_7_transpose_x_0, transpose_y = matmul_7_transpose_y_0, x = transpose_142, y = transpose_143)[name = tensor("matmul_7_cast_fp16")]; tensor softmax_7_axis_0 = const()[name = tensor("softmax_7_axis_0"), val = tensor(-1)]; tensor softmax_7_cast_fp16 = softmax(axis = softmax_7_axis_0, x = matmul_7_cast_fp16)[name = tensor("softmax_7_cast_fp16")]; tensor attn_output_15_transpose_x_0 = const()[name = tensor("attn_output_15_transpose_x_0"), val = tensor(false)]; tensor attn_output_15_transpose_y_0 = const()[name = tensor("attn_output_15_transpose_y_0"), val = tensor(false)]; tensor value_31_cast_fp16 = transpose(perm = value_31_perm_0, x = var_511_cast_fp16)[name = tensor("transpose_291")]; tensor attn_output_15_cast_fp16 = matmul(transpose_x = attn_output_15_transpose_x_0, transpose_y = attn_output_15_transpose_y_0, x = softmax_7_cast_fp16, y = value_31_cast_fp16)[name = tensor("attn_output_15_cast_fp16")]; tensor var_514_perm_0 = const()[name = tensor("op_514_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_516 = const()[name = tensor("op_516"), val = tensor([1, 1500, 1280])]; tensor var_514_cast_fp16 = transpose(perm = var_514_perm_0, x = attn_output_15_cast_fp16)[name = tensor("transpose_288")]; tensor input_77_cast_fp16 = reshape(shape = var_516, x = var_514_cast_fp16)[name = tensor("input_77_cast_fp16")]; tensor encoder_layers_7_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299975616)))]; tensor encoder_layers_7_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303252480)))]; tensor linear_45_cast_fp16 = linear(bias = encoder_layers_7_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_7_self_attn_out_proj_weight_to_fp16, x = input_77_cast_fp16)[name = tensor("linear_45_cast_fp16")]; tensor input_79_cast_fp16 = add(x = input_75_cast_fp16, y = linear_45_cast_fp16)[name = tensor("input_79_cast_fp16")]; tensor input_81_axes_0 = const()[name = tensor("input_81_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_7_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303255104)))]; tensor encoder_layers_7_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_7_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303257728)))]; tensor input_81_cast_fp16 = layer_norm(axes = input_81_axes_0, beta = encoder_layers_7_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_7_final_layer_norm_weight_to_fp16, x = input_79_cast_fp16)[name = tensor("input_81_cast_fp16")]; tensor encoder_layers_7_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_7_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303260352)))]; tensor encoder_layers_7_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_7_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316367616)))]; tensor linear_46_cast_fp16 = linear(bias = encoder_layers_7_fc1_bias_to_fp16, weight = encoder_layers_7_fc1_weight_to_fp16, x = input_81_cast_fp16)[name = tensor("linear_46_cast_fp16")]; tensor input_83_mode_0 = const()[name = tensor("input_83_mode_0"), val = tensor("EXACT")]; tensor input_83_cast_fp16 = gelu(mode = input_83_mode_0, x = linear_46_cast_fp16)[name = tensor("input_83_cast_fp16")]; tensor encoder_layers_7_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_7_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316377920)))]; tensor encoder_layers_7_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_7_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329485184)))]; tensor linear_47_cast_fp16 = linear(bias = encoder_layers_7_fc2_bias_to_fp16, weight = encoder_layers_7_fc2_weight_to_fp16, x = input_83_cast_fp16)[name = tensor("linear_47_cast_fp16")]; tensor input_85_cast_fp16 = add(x = input_79_cast_fp16, y = linear_47_cast_fp16)[name = tensor("input_85_cast_fp16")]; tensor hidden_states_53_axes_0 = const()[name = tensor("hidden_states_53_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329487808)))]; tensor encoder_layers_8_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329490432)))]; tensor hidden_states_53_cast_fp16 = layer_norm(axes = hidden_states_53_axes_0, beta = encoder_layers_8_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_8_self_attn_layer_norm_weight_to_fp16, x = input_85_cast_fp16)[name = tensor("hidden_states_53_cast_fp16")]; tensor encoder_layers_8_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329493056)))]; tensor encoder_layers_8_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(332769920)))]; tensor linear_48_cast_fp16 = linear(bias = encoder_layers_8_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_8_self_attn_q_proj_weight_to_fp16, x = hidden_states_53_cast_fp16)[name = tensor("linear_48_cast_fp16")]; tensor encoder_layers_8_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(332772544)))]; tensor linear_49_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_8_self_attn_k_proj_weight_to_fp16, x = hidden_states_53_cast_fp16)[name = tensor("linear_49_cast_fp16")]; tensor encoder_layers_8_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(336049408)))]; tensor encoder_layers_8_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339326272)))]; tensor linear_50_cast_fp16 = linear(bias = encoder_layers_8_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_8_self_attn_v_proj_weight_to_fp16, x = hidden_states_53_cast_fp16)[name = tensor("linear_50_cast_fp16")]; tensor var_557 = const()[name = tensor("op_557"), val = tensor([1, 1500, 20, 64])]; tensor var_558_cast_fp16 = reshape(shape = var_557, x = linear_48_cast_fp16)[name = tensor("op_558_cast_fp16")]; tensor var_560 = const()[name = tensor("op_560"), val = tensor([1, 1500, 20, 64])]; tensor var_561_cast_fp16 = reshape(shape = var_560, x = linear_49_cast_fp16)[name = tensor("op_561_cast_fp16")]; tensor var_563 = const()[name = tensor("op_563"), val = tensor([1, 1500, 20, 64])]; tensor var_564_cast_fp16 = reshape(shape = var_563, x = linear_50_cast_fp16)[name = tensor("op_564_cast_fp16")]; tensor value_35_perm_0 = const()[name = tensor("value_35_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_8_cast_fp16 = mul(x = var_558_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_8_cast_fp16")]; tensor matmul_8_transpose_y_0 = const()[name = tensor("matmul_8_transpose_y_0"), val = tensor(true)]; tensor matmul_8_transpose_x_0 = const()[name = tensor("matmul_8_transpose_x_0"), val = tensor(false)]; tensor transpose_144_perm_0 = const()[name = tensor("transpose_144_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_145_perm_0 = const()[name = tensor("transpose_145_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_145 = transpose(perm = transpose_145_perm_0, x = var_561_cast_fp16)[name = tensor("transpose_285")]; tensor transpose_144 = transpose(perm = transpose_144_perm_0, x = mul_8_cast_fp16)[name = tensor("transpose_286")]; tensor matmul_8_cast_fp16 = matmul(transpose_x = matmul_8_transpose_x_0, transpose_y = matmul_8_transpose_y_0, x = transpose_144, y = transpose_145)[name = tensor("matmul_8_cast_fp16")]; tensor softmax_8_axis_0 = const()[name = tensor("softmax_8_axis_0"), val = tensor(-1)]; tensor softmax_8_cast_fp16 = softmax(axis = softmax_8_axis_0, x = matmul_8_cast_fp16)[name = tensor("softmax_8_cast_fp16")]; tensor attn_output_17_transpose_x_0 = const()[name = tensor("attn_output_17_transpose_x_0"), val = tensor(false)]; tensor attn_output_17_transpose_y_0 = const()[name = tensor("attn_output_17_transpose_y_0"), val = tensor(false)]; tensor value_35_cast_fp16 = transpose(perm = value_35_perm_0, x = var_564_cast_fp16)[name = tensor("transpose_287")]; tensor attn_output_17_cast_fp16 = matmul(transpose_x = attn_output_17_transpose_x_0, transpose_y = attn_output_17_transpose_y_0, x = softmax_8_cast_fp16, y = value_35_cast_fp16)[name = tensor("attn_output_17_cast_fp16")]; tensor var_567_perm_0 = const()[name = tensor("op_567_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_569 = const()[name = tensor("op_569"), val = tensor([1, 1500, 1280])]; tensor var_567_cast_fp16 = transpose(perm = var_567_perm_0, x = attn_output_17_cast_fp16)[name = tensor("transpose_284")]; tensor input_87_cast_fp16 = reshape(shape = var_569, x = var_567_cast_fp16)[name = tensor("input_87_cast_fp16")]; tensor encoder_layers_8_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339328896)))]; tensor encoder_layers_8_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(342605760)))]; tensor linear_51_cast_fp16 = linear(bias = encoder_layers_8_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_8_self_attn_out_proj_weight_to_fp16, x = input_87_cast_fp16)[name = tensor("linear_51_cast_fp16")]; tensor input_89_cast_fp16 = add(x = input_85_cast_fp16, y = linear_51_cast_fp16)[name = tensor("input_89_cast_fp16")]; tensor input_91_axes_0 = const()[name = tensor("input_91_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_8_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(342608384)))]; tensor encoder_layers_8_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_8_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(342611008)))]; tensor input_91_cast_fp16 = layer_norm(axes = input_91_axes_0, beta = encoder_layers_8_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_8_final_layer_norm_weight_to_fp16, x = input_89_cast_fp16)[name = tensor("input_91_cast_fp16")]; tensor encoder_layers_8_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_8_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(342613632)))]; tensor encoder_layers_8_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_8_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(355720896)))]; tensor linear_52_cast_fp16 = linear(bias = encoder_layers_8_fc1_bias_to_fp16, weight = encoder_layers_8_fc1_weight_to_fp16, x = input_91_cast_fp16)[name = tensor("linear_52_cast_fp16")]; tensor input_93_mode_0 = const()[name = tensor("input_93_mode_0"), val = tensor("EXACT")]; tensor input_93_cast_fp16 = gelu(mode = input_93_mode_0, x = linear_52_cast_fp16)[name = tensor("input_93_cast_fp16")]; tensor encoder_layers_8_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_8_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(355731200)))]; tensor encoder_layers_8_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_8_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368838464)))]; tensor linear_53_cast_fp16 = linear(bias = encoder_layers_8_fc2_bias_to_fp16, weight = encoder_layers_8_fc2_weight_to_fp16, x = input_93_cast_fp16)[name = tensor("linear_53_cast_fp16")]; tensor input_95_cast_fp16 = add(x = input_89_cast_fp16, y = linear_53_cast_fp16)[name = tensor("input_95_cast_fp16")]; tensor hidden_states_59_axes_0 = const()[name = tensor("hidden_states_59_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368841088)))]; tensor encoder_layers_9_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368843712)))]; tensor hidden_states_59_cast_fp16 = layer_norm(axes = hidden_states_59_axes_0, beta = encoder_layers_9_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_9_self_attn_layer_norm_weight_to_fp16, x = input_95_cast_fp16)[name = tensor("hidden_states_59_cast_fp16")]; tensor encoder_layers_9_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368846336)))]; tensor encoder_layers_9_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(372123200)))]; tensor linear_54_cast_fp16 = linear(bias = encoder_layers_9_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_9_self_attn_q_proj_weight_to_fp16, x = hidden_states_59_cast_fp16)[name = tensor("linear_54_cast_fp16")]; tensor encoder_layers_9_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(372125824)))]; tensor linear_55_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_9_self_attn_k_proj_weight_to_fp16, x = hidden_states_59_cast_fp16)[name = tensor("linear_55_cast_fp16")]; tensor encoder_layers_9_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(375402688)))]; tensor encoder_layers_9_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(378679552)))]; tensor linear_56_cast_fp16 = linear(bias = encoder_layers_9_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_9_self_attn_v_proj_weight_to_fp16, x = hidden_states_59_cast_fp16)[name = tensor("linear_56_cast_fp16")]; tensor var_610 = const()[name = tensor("op_610"), val = tensor([1, 1500, 20, 64])]; tensor var_611_cast_fp16 = reshape(shape = var_610, x = linear_54_cast_fp16)[name = tensor("op_611_cast_fp16")]; tensor var_613 = const()[name = tensor("op_613"), val = tensor([1, 1500, 20, 64])]; tensor var_614_cast_fp16 = reshape(shape = var_613, x = linear_55_cast_fp16)[name = tensor("op_614_cast_fp16")]; tensor var_616 = const()[name = tensor("op_616"), val = tensor([1, 1500, 20, 64])]; tensor var_617_cast_fp16 = reshape(shape = var_616, x = linear_56_cast_fp16)[name = tensor("op_617_cast_fp16")]; tensor value_39_perm_0 = const()[name = tensor("value_39_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_9_cast_fp16 = mul(x = var_611_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_9_cast_fp16")]; tensor matmul_9_transpose_y_0 = const()[name = tensor("matmul_9_transpose_y_0"), val = tensor(true)]; tensor matmul_9_transpose_x_0 = const()[name = tensor("matmul_9_transpose_x_0"), val = tensor(false)]; tensor transpose_146_perm_0 = const()[name = tensor("transpose_146_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_147_perm_0 = const()[name = tensor("transpose_147_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_147 = transpose(perm = transpose_147_perm_0, x = var_614_cast_fp16)[name = tensor("transpose_281")]; tensor transpose_146 = transpose(perm = transpose_146_perm_0, x = mul_9_cast_fp16)[name = tensor("transpose_282")]; tensor matmul_9_cast_fp16 = matmul(transpose_x = matmul_9_transpose_x_0, transpose_y = matmul_9_transpose_y_0, x = transpose_146, y = transpose_147)[name = tensor("matmul_9_cast_fp16")]; tensor softmax_9_axis_0 = const()[name = tensor("softmax_9_axis_0"), val = tensor(-1)]; tensor softmax_9_cast_fp16 = softmax(axis = softmax_9_axis_0, x = matmul_9_cast_fp16)[name = tensor("softmax_9_cast_fp16")]; tensor attn_output_19_transpose_x_0 = const()[name = tensor("attn_output_19_transpose_x_0"), val = tensor(false)]; tensor attn_output_19_transpose_y_0 = const()[name = tensor("attn_output_19_transpose_y_0"), val = tensor(false)]; tensor value_39_cast_fp16 = transpose(perm = value_39_perm_0, x = var_617_cast_fp16)[name = tensor("transpose_283")]; tensor attn_output_19_cast_fp16 = matmul(transpose_x = attn_output_19_transpose_x_0, transpose_y = attn_output_19_transpose_y_0, x = softmax_9_cast_fp16, y = value_39_cast_fp16)[name = tensor("attn_output_19_cast_fp16")]; tensor var_620_perm_0 = const()[name = tensor("op_620_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_622 = const()[name = tensor("op_622"), val = tensor([1, 1500, 1280])]; tensor var_620_cast_fp16 = transpose(perm = var_620_perm_0, x = attn_output_19_cast_fp16)[name = tensor("transpose_280")]; tensor input_97_cast_fp16 = reshape(shape = var_622, x = var_620_cast_fp16)[name = tensor("input_97_cast_fp16")]; tensor encoder_layers_9_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(378682176)))]; tensor encoder_layers_9_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(381959040)))]; tensor linear_57_cast_fp16 = linear(bias = encoder_layers_9_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_9_self_attn_out_proj_weight_to_fp16, x = input_97_cast_fp16)[name = tensor("linear_57_cast_fp16")]; tensor input_99_cast_fp16 = add(x = input_95_cast_fp16, y = linear_57_cast_fp16)[name = tensor("input_99_cast_fp16")]; tensor input_101_axes_0 = const()[name = tensor("input_101_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_9_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(381961664)))]; tensor encoder_layers_9_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_9_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(381964288)))]; tensor input_101_cast_fp16 = layer_norm(axes = input_101_axes_0, beta = encoder_layers_9_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_9_final_layer_norm_weight_to_fp16, x = input_99_cast_fp16)[name = tensor("input_101_cast_fp16")]; tensor encoder_layers_9_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_9_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(381966912)))]; tensor encoder_layers_9_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_9_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(395074176)))]; tensor linear_58_cast_fp16 = linear(bias = encoder_layers_9_fc1_bias_to_fp16, weight = encoder_layers_9_fc1_weight_to_fp16, x = input_101_cast_fp16)[name = tensor("linear_58_cast_fp16")]; tensor input_103_mode_0 = const()[name = tensor("input_103_mode_0"), val = tensor("EXACT")]; tensor input_103_cast_fp16 = gelu(mode = input_103_mode_0, x = linear_58_cast_fp16)[name = tensor("input_103_cast_fp16")]; tensor encoder_layers_9_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_9_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(395084480)))]; tensor encoder_layers_9_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_9_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(408191744)))]; tensor linear_59_cast_fp16 = linear(bias = encoder_layers_9_fc2_bias_to_fp16, weight = encoder_layers_9_fc2_weight_to_fp16, x = input_103_cast_fp16)[name = tensor("linear_59_cast_fp16")]; tensor input_105_cast_fp16 = add(x = input_99_cast_fp16, y = linear_59_cast_fp16)[name = tensor("input_105_cast_fp16")]; tensor hidden_states_65_axes_0 = const()[name = tensor("hidden_states_65_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(408194368)))]; tensor encoder_layers_10_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(408196992)))]; tensor hidden_states_65_cast_fp16 = layer_norm(axes = hidden_states_65_axes_0, beta = encoder_layers_10_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_10_self_attn_layer_norm_weight_to_fp16, x = input_105_cast_fp16)[name = tensor("hidden_states_65_cast_fp16")]; tensor encoder_layers_10_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(408199616)))]; tensor encoder_layers_10_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(411476480)))]; tensor linear_60_cast_fp16 = linear(bias = encoder_layers_10_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_10_self_attn_q_proj_weight_to_fp16, x = hidden_states_65_cast_fp16)[name = tensor("linear_60_cast_fp16")]; tensor encoder_layers_10_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(411479104)))]; tensor linear_61_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_10_self_attn_k_proj_weight_to_fp16, x = hidden_states_65_cast_fp16)[name = tensor("linear_61_cast_fp16")]; tensor encoder_layers_10_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(414755968)))]; tensor encoder_layers_10_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418032832)))]; tensor linear_62_cast_fp16 = linear(bias = encoder_layers_10_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_10_self_attn_v_proj_weight_to_fp16, x = hidden_states_65_cast_fp16)[name = tensor("linear_62_cast_fp16")]; tensor var_663 = const()[name = tensor("op_663"), val = tensor([1, 1500, 20, 64])]; tensor var_664_cast_fp16 = reshape(shape = var_663, x = linear_60_cast_fp16)[name = tensor("op_664_cast_fp16")]; tensor var_666 = const()[name = tensor("op_666"), val = tensor([1, 1500, 20, 64])]; tensor var_667_cast_fp16 = reshape(shape = var_666, x = linear_61_cast_fp16)[name = tensor("op_667_cast_fp16")]; tensor var_669 = const()[name = tensor("op_669"), val = tensor([1, 1500, 20, 64])]; tensor var_670_cast_fp16 = reshape(shape = var_669, x = linear_62_cast_fp16)[name = tensor("op_670_cast_fp16")]; tensor value_43_perm_0 = const()[name = tensor("value_43_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_10_cast_fp16 = mul(x = var_664_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_10_cast_fp16")]; tensor matmul_10_transpose_y_0 = const()[name = tensor("matmul_10_transpose_y_0"), val = tensor(true)]; tensor matmul_10_transpose_x_0 = const()[name = tensor("matmul_10_transpose_x_0"), val = tensor(false)]; tensor transpose_148_perm_0 = const()[name = tensor("transpose_148_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_149_perm_0 = const()[name = tensor("transpose_149_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_149 = transpose(perm = transpose_149_perm_0, x = var_667_cast_fp16)[name = tensor("transpose_277")]; tensor transpose_148 = transpose(perm = transpose_148_perm_0, x = mul_10_cast_fp16)[name = tensor("transpose_278")]; tensor matmul_10_cast_fp16 = matmul(transpose_x = matmul_10_transpose_x_0, transpose_y = matmul_10_transpose_y_0, x = transpose_148, y = transpose_149)[name = tensor("matmul_10_cast_fp16")]; tensor softmax_10_axis_0 = const()[name = tensor("softmax_10_axis_0"), val = tensor(-1)]; tensor softmax_10_cast_fp16 = softmax(axis = softmax_10_axis_0, x = matmul_10_cast_fp16)[name = tensor("softmax_10_cast_fp16")]; tensor attn_output_21_transpose_x_0 = const()[name = tensor("attn_output_21_transpose_x_0"), val = tensor(false)]; tensor attn_output_21_transpose_y_0 = const()[name = tensor("attn_output_21_transpose_y_0"), val = tensor(false)]; tensor value_43_cast_fp16 = transpose(perm = value_43_perm_0, x = var_670_cast_fp16)[name = tensor("transpose_279")]; tensor attn_output_21_cast_fp16 = matmul(transpose_x = attn_output_21_transpose_x_0, transpose_y = attn_output_21_transpose_y_0, x = softmax_10_cast_fp16, y = value_43_cast_fp16)[name = tensor("attn_output_21_cast_fp16")]; tensor var_673_perm_0 = const()[name = tensor("op_673_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_675 = const()[name = tensor("op_675"), val = tensor([1, 1500, 1280])]; tensor var_673_cast_fp16 = transpose(perm = var_673_perm_0, x = attn_output_21_cast_fp16)[name = tensor("transpose_276")]; tensor input_107_cast_fp16 = reshape(shape = var_675, x = var_673_cast_fp16)[name = tensor("input_107_cast_fp16")]; tensor encoder_layers_10_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418035456)))]; tensor encoder_layers_10_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421312320)))]; tensor linear_63_cast_fp16 = linear(bias = encoder_layers_10_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_10_self_attn_out_proj_weight_to_fp16, x = input_107_cast_fp16)[name = tensor("linear_63_cast_fp16")]; tensor input_109_cast_fp16 = add(x = input_105_cast_fp16, y = linear_63_cast_fp16)[name = tensor("input_109_cast_fp16")]; tensor input_111_axes_0 = const()[name = tensor("input_111_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_10_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421314944)))]; tensor encoder_layers_10_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_10_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421317568)))]; tensor input_111_cast_fp16 = layer_norm(axes = input_111_axes_0, beta = encoder_layers_10_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_10_final_layer_norm_weight_to_fp16, x = input_109_cast_fp16)[name = tensor("input_111_cast_fp16")]; tensor encoder_layers_10_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_10_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421320192)))]; tensor encoder_layers_10_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_10_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(434427456)))]; tensor linear_64_cast_fp16 = linear(bias = encoder_layers_10_fc1_bias_to_fp16, weight = encoder_layers_10_fc1_weight_to_fp16, x = input_111_cast_fp16)[name = tensor("linear_64_cast_fp16")]; tensor input_113_mode_0 = const()[name = tensor("input_113_mode_0"), val = tensor("EXACT")]; tensor input_113_cast_fp16 = gelu(mode = input_113_mode_0, x = linear_64_cast_fp16)[name = tensor("input_113_cast_fp16")]; tensor encoder_layers_10_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_10_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(434437760)))]; tensor encoder_layers_10_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_10_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(447545024)))]; tensor linear_65_cast_fp16 = linear(bias = encoder_layers_10_fc2_bias_to_fp16, weight = encoder_layers_10_fc2_weight_to_fp16, x = input_113_cast_fp16)[name = tensor("linear_65_cast_fp16")]; tensor input_115_cast_fp16 = add(x = input_109_cast_fp16, y = linear_65_cast_fp16)[name = tensor("input_115_cast_fp16")]; tensor hidden_states_71_axes_0 = const()[name = tensor("hidden_states_71_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(447547648)))]; tensor encoder_layers_11_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(447550272)))]; tensor hidden_states_71_cast_fp16 = layer_norm(axes = hidden_states_71_axes_0, beta = encoder_layers_11_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_11_self_attn_layer_norm_weight_to_fp16, x = input_115_cast_fp16)[name = tensor("hidden_states_71_cast_fp16")]; tensor encoder_layers_11_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(447552896)))]; tensor encoder_layers_11_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(450829760)))]; tensor linear_66_cast_fp16 = linear(bias = encoder_layers_11_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_11_self_attn_q_proj_weight_to_fp16, x = hidden_states_71_cast_fp16)[name = tensor("linear_66_cast_fp16")]; tensor encoder_layers_11_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(450832384)))]; tensor linear_67_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_11_self_attn_k_proj_weight_to_fp16, x = hidden_states_71_cast_fp16)[name = tensor("linear_67_cast_fp16")]; tensor encoder_layers_11_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(454109248)))]; tensor encoder_layers_11_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(457386112)))]; tensor linear_68_cast_fp16 = linear(bias = encoder_layers_11_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_11_self_attn_v_proj_weight_to_fp16, x = hidden_states_71_cast_fp16)[name = tensor("linear_68_cast_fp16")]; tensor var_716 = const()[name = tensor("op_716"), val = tensor([1, 1500, 20, 64])]; tensor var_717_cast_fp16 = reshape(shape = var_716, x = linear_66_cast_fp16)[name = tensor("op_717_cast_fp16")]; tensor var_719 = const()[name = tensor("op_719"), val = tensor([1, 1500, 20, 64])]; tensor var_720_cast_fp16 = reshape(shape = var_719, x = linear_67_cast_fp16)[name = tensor("op_720_cast_fp16")]; tensor var_722 = const()[name = tensor("op_722"), val = tensor([1, 1500, 20, 64])]; tensor var_723_cast_fp16 = reshape(shape = var_722, x = linear_68_cast_fp16)[name = tensor("op_723_cast_fp16")]; tensor value_47_perm_0 = const()[name = tensor("value_47_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_11_cast_fp16 = mul(x = var_717_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_11_cast_fp16")]; tensor matmul_11_transpose_y_0 = const()[name = tensor("matmul_11_transpose_y_0"), val = tensor(true)]; tensor matmul_11_transpose_x_0 = const()[name = tensor("matmul_11_transpose_x_0"), val = tensor(false)]; tensor transpose_150_perm_0 = const()[name = tensor("transpose_150_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_151_perm_0 = const()[name = tensor("transpose_151_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_151 = transpose(perm = transpose_151_perm_0, x = var_720_cast_fp16)[name = tensor("transpose_273")]; tensor transpose_150 = transpose(perm = transpose_150_perm_0, x = mul_11_cast_fp16)[name = tensor("transpose_274")]; tensor matmul_11_cast_fp16 = matmul(transpose_x = matmul_11_transpose_x_0, transpose_y = matmul_11_transpose_y_0, x = transpose_150, y = transpose_151)[name = tensor("matmul_11_cast_fp16")]; tensor softmax_11_axis_0 = const()[name = tensor("softmax_11_axis_0"), val = tensor(-1)]; tensor softmax_11_cast_fp16 = softmax(axis = softmax_11_axis_0, x = matmul_11_cast_fp16)[name = tensor("softmax_11_cast_fp16")]; tensor attn_output_23_transpose_x_0 = const()[name = tensor("attn_output_23_transpose_x_0"), val = tensor(false)]; tensor attn_output_23_transpose_y_0 = const()[name = tensor("attn_output_23_transpose_y_0"), val = tensor(false)]; tensor value_47_cast_fp16 = transpose(perm = value_47_perm_0, x = var_723_cast_fp16)[name = tensor("transpose_275")]; tensor attn_output_23_cast_fp16 = matmul(transpose_x = attn_output_23_transpose_x_0, transpose_y = attn_output_23_transpose_y_0, x = softmax_11_cast_fp16, y = value_47_cast_fp16)[name = tensor("attn_output_23_cast_fp16")]; tensor var_726_perm_0 = const()[name = tensor("op_726_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_728 = const()[name = tensor("op_728"), val = tensor([1, 1500, 1280])]; tensor var_726_cast_fp16 = transpose(perm = var_726_perm_0, x = attn_output_23_cast_fp16)[name = tensor("transpose_272")]; tensor input_117_cast_fp16 = reshape(shape = var_728, x = var_726_cast_fp16)[name = tensor("input_117_cast_fp16")]; tensor encoder_layers_11_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(457388736)))]; tensor encoder_layers_11_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(460665600)))]; tensor linear_69_cast_fp16 = linear(bias = encoder_layers_11_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_11_self_attn_out_proj_weight_to_fp16, x = input_117_cast_fp16)[name = tensor("linear_69_cast_fp16")]; tensor input_119_cast_fp16 = add(x = input_115_cast_fp16, y = linear_69_cast_fp16)[name = tensor("input_119_cast_fp16")]; tensor input_121_axes_0 = const()[name = tensor("input_121_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_11_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(460668224)))]; tensor encoder_layers_11_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_11_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(460670848)))]; tensor input_121_cast_fp16 = layer_norm(axes = input_121_axes_0, beta = encoder_layers_11_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_11_final_layer_norm_weight_to_fp16, x = input_119_cast_fp16)[name = tensor("input_121_cast_fp16")]; tensor encoder_layers_11_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_11_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(460673472)))]; tensor encoder_layers_11_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_11_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(473780736)))]; tensor linear_70_cast_fp16 = linear(bias = encoder_layers_11_fc1_bias_to_fp16, weight = encoder_layers_11_fc1_weight_to_fp16, x = input_121_cast_fp16)[name = tensor("linear_70_cast_fp16")]; tensor input_123_mode_0 = const()[name = tensor("input_123_mode_0"), val = tensor("EXACT")]; tensor input_123_cast_fp16 = gelu(mode = input_123_mode_0, x = linear_70_cast_fp16)[name = tensor("input_123_cast_fp16")]; tensor encoder_layers_11_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_11_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(473791040)))]; tensor encoder_layers_11_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_11_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(486898304)))]; tensor linear_71_cast_fp16 = linear(bias = encoder_layers_11_fc2_bias_to_fp16, weight = encoder_layers_11_fc2_weight_to_fp16, x = input_123_cast_fp16)[name = tensor("linear_71_cast_fp16")]; tensor input_125_cast_fp16 = add(x = input_119_cast_fp16, y = linear_71_cast_fp16)[name = tensor("input_125_cast_fp16")]; tensor hidden_states_77_axes_0 = const()[name = tensor("hidden_states_77_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(486900928)))]; tensor encoder_layers_12_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(486903552)))]; tensor hidden_states_77_cast_fp16 = layer_norm(axes = hidden_states_77_axes_0, beta = encoder_layers_12_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_12_self_attn_layer_norm_weight_to_fp16, x = input_125_cast_fp16)[name = tensor("hidden_states_77_cast_fp16")]; tensor encoder_layers_12_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(486906176)))]; tensor encoder_layers_12_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(490183040)))]; tensor linear_72_cast_fp16 = linear(bias = encoder_layers_12_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_12_self_attn_q_proj_weight_to_fp16, x = hidden_states_77_cast_fp16)[name = tensor("linear_72_cast_fp16")]; tensor encoder_layers_12_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(490185664)))]; tensor linear_73_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_12_self_attn_k_proj_weight_to_fp16, x = hidden_states_77_cast_fp16)[name = tensor("linear_73_cast_fp16")]; tensor encoder_layers_12_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(493462528)))]; tensor encoder_layers_12_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496739392)))]; tensor linear_74_cast_fp16 = linear(bias = encoder_layers_12_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_12_self_attn_v_proj_weight_to_fp16, x = hidden_states_77_cast_fp16)[name = tensor("linear_74_cast_fp16")]; tensor var_769 = const()[name = tensor("op_769"), val = tensor([1, 1500, 20, 64])]; tensor var_770_cast_fp16 = reshape(shape = var_769, x = linear_72_cast_fp16)[name = tensor("op_770_cast_fp16")]; tensor var_772 = const()[name = tensor("op_772"), val = tensor([1, 1500, 20, 64])]; tensor var_773_cast_fp16 = reshape(shape = var_772, x = linear_73_cast_fp16)[name = tensor("op_773_cast_fp16")]; tensor var_775 = const()[name = tensor("op_775"), val = tensor([1, 1500, 20, 64])]; tensor var_776_cast_fp16 = reshape(shape = var_775, x = linear_74_cast_fp16)[name = tensor("op_776_cast_fp16")]; tensor value_51_perm_0 = const()[name = tensor("value_51_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_12_cast_fp16 = mul(x = var_770_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_12_cast_fp16")]; tensor matmul_12_transpose_y_0 = const()[name = tensor("matmul_12_transpose_y_0"), val = tensor(true)]; tensor matmul_12_transpose_x_0 = const()[name = tensor("matmul_12_transpose_x_0"), val = tensor(false)]; tensor transpose_152_perm_0 = const()[name = tensor("transpose_152_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_153_perm_0 = const()[name = tensor("transpose_153_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_153 = transpose(perm = transpose_153_perm_0, x = var_773_cast_fp16)[name = tensor("transpose_269")]; tensor transpose_152 = transpose(perm = transpose_152_perm_0, x = mul_12_cast_fp16)[name = tensor("transpose_270")]; tensor matmul_12_cast_fp16 = matmul(transpose_x = matmul_12_transpose_x_0, transpose_y = matmul_12_transpose_y_0, x = transpose_152, y = transpose_153)[name = tensor("matmul_12_cast_fp16")]; tensor softmax_12_axis_0 = const()[name = tensor("softmax_12_axis_0"), val = tensor(-1)]; tensor softmax_12_cast_fp16 = softmax(axis = softmax_12_axis_0, x = matmul_12_cast_fp16)[name = tensor("softmax_12_cast_fp16")]; tensor attn_output_25_transpose_x_0 = const()[name = tensor("attn_output_25_transpose_x_0"), val = tensor(false)]; tensor attn_output_25_transpose_y_0 = const()[name = tensor("attn_output_25_transpose_y_0"), val = tensor(false)]; tensor value_51_cast_fp16 = transpose(perm = value_51_perm_0, x = var_776_cast_fp16)[name = tensor("transpose_271")]; tensor attn_output_25_cast_fp16 = matmul(transpose_x = attn_output_25_transpose_x_0, transpose_y = attn_output_25_transpose_y_0, x = softmax_12_cast_fp16, y = value_51_cast_fp16)[name = tensor("attn_output_25_cast_fp16")]; tensor var_779_perm_0 = const()[name = tensor("op_779_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_781 = const()[name = tensor("op_781"), val = tensor([1, 1500, 1280])]; tensor var_779_cast_fp16 = transpose(perm = var_779_perm_0, x = attn_output_25_cast_fp16)[name = tensor("transpose_268")]; tensor input_127_cast_fp16 = reshape(shape = var_781, x = var_779_cast_fp16)[name = tensor("input_127_cast_fp16")]; tensor encoder_layers_12_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496742016)))]; tensor encoder_layers_12_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(500018880)))]; tensor linear_75_cast_fp16 = linear(bias = encoder_layers_12_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_12_self_attn_out_proj_weight_to_fp16, x = input_127_cast_fp16)[name = tensor("linear_75_cast_fp16")]; tensor input_129_cast_fp16 = add(x = input_125_cast_fp16, y = linear_75_cast_fp16)[name = tensor("input_129_cast_fp16")]; tensor input_131_axes_0 = const()[name = tensor("input_131_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_12_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(500021504)))]; tensor encoder_layers_12_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_12_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(500024128)))]; tensor input_131_cast_fp16 = layer_norm(axes = input_131_axes_0, beta = encoder_layers_12_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_12_final_layer_norm_weight_to_fp16, x = input_129_cast_fp16)[name = tensor("input_131_cast_fp16")]; tensor encoder_layers_12_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_12_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(500026752)))]; tensor encoder_layers_12_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_12_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513134016)))]; tensor linear_76_cast_fp16 = linear(bias = encoder_layers_12_fc1_bias_to_fp16, weight = encoder_layers_12_fc1_weight_to_fp16, x = input_131_cast_fp16)[name = tensor("linear_76_cast_fp16")]; tensor input_133_mode_0 = const()[name = tensor("input_133_mode_0"), val = tensor("EXACT")]; tensor input_133_cast_fp16 = gelu(mode = input_133_mode_0, x = linear_76_cast_fp16)[name = tensor("input_133_cast_fp16")]; tensor encoder_layers_12_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_12_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513144320)))]; tensor encoder_layers_12_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_12_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526251584)))]; tensor linear_77_cast_fp16 = linear(bias = encoder_layers_12_fc2_bias_to_fp16, weight = encoder_layers_12_fc2_weight_to_fp16, x = input_133_cast_fp16)[name = tensor("linear_77_cast_fp16")]; tensor input_135_cast_fp16 = add(x = input_129_cast_fp16, y = linear_77_cast_fp16)[name = tensor("input_135_cast_fp16")]; tensor hidden_states_83_axes_0 = const()[name = tensor("hidden_states_83_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526254208)))]; tensor encoder_layers_13_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526256832)))]; tensor hidden_states_83_cast_fp16 = layer_norm(axes = hidden_states_83_axes_0, beta = encoder_layers_13_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_13_self_attn_layer_norm_weight_to_fp16, x = input_135_cast_fp16)[name = tensor("hidden_states_83_cast_fp16")]; tensor encoder_layers_13_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526259456)))]; tensor encoder_layers_13_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(529536320)))]; tensor linear_78_cast_fp16 = linear(bias = encoder_layers_13_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_13_self_attn_q_proj_weight_to_fp16, x = hidden_states_83_cast_fp16)[name = tensor("linear_78_cast_fp16")]; tensor encoder_layers_13_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(529538944)))]; tensor linear_79_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_13_self_attn_k_proj_weight_to_fp16, x = hidden_states_83_cast_fp16)[name = tensor("linear_79_cast_fp16")]; tensor encoder_layers_13_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(532815808)))]; tensor encoder_layers_13_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(536092672)))]; tensor linear_80_cast_fp16 = linear(bias = encoder_layers_13_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_13_self_attn_v_proj_weight_to_fp16, x = hidden_states_83_cast_fp16)[name = tensor("linear_80_cast_fp16")]; tensor var_822 = const()[name = tensor("op_822"), val = tensor([1, 1500, 20, 64])]; tensor var_823_cast_fp16 = reshape(shape = var_822, x = linear_78_cast_fp16)[name = tensor("op_823_cast_fp16")]; tensor var_825 = const()[name = tensor("op_825"), val = tensor([1, 1500, 20, 64])]; tensor var_826_cast_fp16 = reshape(shape = var_825, x = linear_79_cast_fp16)[name = tensor("op_826_cast_fp16")]; tensor var_828 = const()[name = tensor("op_828"), val = tensor([1, 1500, 20, 64])]; tensor var_829_cast_fp16 = reshape(shape = var_828, x = linear_80_cast_fp16)[name = tensor("op_829_cast_fp16")]; tensor value_55_perm_0 = const()[name = tensor("value_55_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_13_cast_fp16 = mul(x = var_823_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_13_cast_fp16")]; tensor matmul_13_transpose_y_0 = const()[name = tensor("matmul_13_transpose_y_0"), val = tensor(true)]; tensor matmul_13_transpose_x_0 = const()[name = tensor("matmul_13_transpose_x_0"), val = tensor(false)]; tensor transpose_154_perm_0 = const()[name = tensor("transpose_154_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_155_perm_0 = const()[name = tensor("transpose_155_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_155 = transpose(perm = transpose_155_perm_0, x = var_826_cast_fp16)[name = tensor("transpose_265")]; tensor transpose_154 = transpose(perm = transpose_154_perm_0, x = mul_13_cast_fp16)[name = tensor("transpose_266")]; tensor matmul_13_cast_fp16 = matmul(transpose_x = matmul_13_transpose_x_0, transpose_y = matmul_13_transpose_y_0, x = transpose_154, y = transpose_155)[name = tensor("matmul_13_cast_fp16")]; tensor softmax_13_axis_0 = const()[name = tensor("softmax_13_axis_0"), val = tensor(-1)]; tensor softmax_13_cast_fp16 = softmax(axis = softmax_13_axis_0, x = matmul_13_cast_fp16)[name = tensor("softmax_13_cast_fp16")]; tensor attn_output_27_transpose_x_0 = const()[name = tensor("attn_output_27_transpose_x_0"), val = tensor(false)]; tensor attn_output_27_transpose_y_0 = const()[name = tensor("attn_output_27_transpose_y_0"), val = tensor(false)]; tensor value_55_cast_fp16 = transpose(perm = value_55_perm_0, x = var_829_cast_fp16)[name = tensor("transpose_267")]; tensor attn_output_27_cast_fp16 = matmul(transpose_x = attn_output_27_transpose_x_0, transpose_y = attn_output_27_transpose_y_0, x = softmax_13_cast_fp16, y = value_55_cast_fp16)[name = tensor("attn_output_27_cast_fp16")]; tensor var_832_perm_0 = const()[name = tensor("op_832_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_834 = const()[name = tensor("op_834"), val = tensor([1, 1500, 1280])]; tensor var_832_cast_fp16 = transpose(perm = var_832_perm_0, x = attn_output_27_cast_fp16)[name = tensor("transpose_264")]; tensor input_137_cast_fp16 = reshape(shape = var_834, x = var_832_cast_fp16)[name = tensor("input_137_cast_fp16")]; tensor encoder_layers_13_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(536095296)))]; tensor encoder_layers_13_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(539372160)))]; tensor linear_81_cast_fp16 = linear(bias = encoder_layers_13_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_13_self_attn_out_proj_weight_to_fp16, x = input_137_cast_fp16)[name = tensor("linear_81_cast_fp16")]; tensor input_139_cast_fp16 = add(x = input_135_cast_fp16, y = linear_81_cast_fp16)[name = tensor("input_139_cast_fp16")]; tensor input_141_axes_0 = const()[name = tensor("input_141_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_13_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(539374784)))]; tensor encoder_layers_13_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_13_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(539377408)))]; tensor input_141_cast_fp16 = layer_norm(axes = input_141_axes_0, beta = encoder_layers_13_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_13_final_layer_norm_weight_to_fp16, x = input_139_cast_fp16)[name = tensor("input_141_cast_fp16")]; tensor encoder_layers_13_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_13_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(539380032)))]; tensor encoder_layers_13_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_13_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(552487296)))]; tensor linear_82_cast_fp16 = linear(bias = encoder_layers_13_fc1_bias_to_fp16, weight = encoder_layers_13_fc1_weight_to_fp16, x = input_141_cast_fp16)[name = tensor("linear_82_cast_fp16")]; tensor input_143_mode_0 = const()[name = tensor("input_143_mode_0"), val = tensor("EXACT")]; tensor input_143_cast_fp16 = gelu(mode = input_143_mode_0, x = linear_82_cast_fp16)[name = tensor("input_143_cast_fp16")]; tensor encoder_layers_13_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_13_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(552497600)))]; tensor encoder_layers_13_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_13_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(565604864)))]; tensor linear_83_cast_fp16 = linear(bias = encoder_layers_13_fc2_bias_to_fp16, weight = encoder_layers_13_fc2_weight_to_fp16, x = input_143_cast_fp16)[name = tensor("linear_83_cast_fp16")]; tensor input_145_cast_fp16 = add(x = input_139_cast_fp16, y = linear_83_cast_fp16)[name = tensor("input_145_cast_fp16")]; tensor hidden_states_89_axes_0 = const()[name = tensor("hidden_states_89_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(565607488)))]; tensor encoder_layers_14_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(565610112)))]; tensor hidden_states_89_cast_fp16 = layer_norm(axes = hidden_states_89_axes_0, beta = encoder_layers_14_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_14_self_attn_layer_norm_weight_to_fp16, x = input_145_cast_fp16)[name = tensor("hidden_states_89_cast_fp16")]; tensor encoder_layers_14_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(565612736)))]; tensor encoder_layers_14_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(568889600)))]; tensor linear_84_cast_fp16 = linear(bias = encoder_layers_14_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_14_self_attn_q_proj_weight_to_fp16, x = hidden_states_89_cast_fp16)[name = tensor("linear_84_cast_fp16")]; tensor encoder_layers_14_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(568892224)))]; tensor linear_85_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_14_self_attn_k_proj_weight_to_fp16, x = hidden_states_89_cast_fp16)[name = tensor("linear_85_cast_fp16")]; tensor encoder_layers_14_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(572169088)))]; tensor encoder_layers_14_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575445952)))]; tensor linear_86_cast_fp16 = linear(bias = encoder_layers_14_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_14_self_attn_v_proj_weight_to_fp16, x = hidden_states_89_cast_fp16)[name = tensor("linear_86_cast_fp16")]; tensor var_875 = const()[name = tensor("op_875"), val = tensor([1, 1500, 20, 64])]; tensor var_876_cast_fp16 = reshape(shape = var_875, x = linear_84_cast_fp16)[name = tensor("op_876_cast_fp16")]; tensor var_878 = const()[name = tensor("op_878"), val = tensor([1, 1500, 20, 64])]; tensor var_879_cast_fp16 = reshape(shape = var_878, x = linear_85_cast_fp16)[name = tensor("op_879_cast_fp16")]; tensor var_881 = const()[name = tensor("op_881"), val = tensor([1, 1500, 20, 64])]; tensor var_882_cast_fp16 = reshape(shape = var_881, x = linear_86_cast_fp16)[name = tensor("op_882_cast_fp16")]; tensor value_59_perm_0 = const()[name = tensor("value_59_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_14_cast_fp16 = mul(x = var_876_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_14_cast_fp16")]; tensor matmul_14_transpose_y_0 = const()[name = tensor("matmul_14_transpose_y_0"), val = tensor(true)]; tensor matmul_14_transpose_x_0 = const()[name = tensor("matmul_14_transpose_x_0"), val = tensor(false)]; tensor transpose_156_perm_0 = const()[name = tensor("transpose_156_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_157_perm_0 = const()[name = tensor("transpose_157_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_157 = transpose(perm = transpose_157_perm_0, x = var_879_cast_fp16)[name = tensor("transpose_261")]; tensor transpose_156 = transpose(perm = transpose_156_perm_0, x = mul_14_cast_fp16)[name = tensor("transpose_262")]; tensor matmul_14_cast_fp16 = matmul(transpose_x = matmul_14_transpose_x_0, transpose_y = matmul_14_transpose_y_0, x = transpose_156, y = transpose_157)[name = tensor("matmul_14_cast_fp16")]; tensor softmax_14_axis_0 = const()[name = tensor("softmax_14_axis_0"), val = tensor(-1)]; tensor softmax_14_cast_fp16 = softmax(axis = softmax_14_axis_0, x = matmul_14_cast_fp16)[name = tensor("softmax_14_cast_fp16")]; tensor attn_output_29_transpose_x_0 = const()[name = tensor("attn_output_29_transpose_x_0"), val = tensor(false)]; tensor attn_output_29_transpose_y_0 = const()[name = tensor("attn_output_29_transpose_y_0"), val = tensor(false)]; tensor value_59_cast_fp16 = transpose(perm = value_59_perm_0, x = var_882_cast_fp16)[name = tensor("transpose_263")]; tensor attn_output_29_cast_fp16 = matmul(transpose_x = attn_output_29_transpose_x_0, transpose_y = attn_output_29_transpose_y_0, x = softmax_14_cast_fp16, y = value_59_cast_fp16)[name = tensor("attn_output_29_cast_fp16")]; tensor var_885_perm_0 = const()[name = tensor("op_885_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_887 = const()[name = tensor("op_887"), val = tensor([1, 1500, 1280])]; tensor var_885_cast_fp16 = transpose(perm = var_885_perm_0, x = attn_output_29_cast_fp16)[name = tensor("transpose_260")]; tensor input_147_cast_fp16 = reshape(shape = var_887, x = var_885_cast_fp16)[name = tensor("input_147_cast_fp16")]; tensor encoder_layers_14_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575448576)))]; tensor encoder_layers_14_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(578725440)))]; tensor linear_87_cast_fp16 = linear(bias = encoder_layers_14_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_14_self_attn_out_proj_weight_to_fp16, x = input_147_cast_fp16)[name = tensor("linear_87_cast_fp16")]; tensor input_149_cast_fp16 = add(x = input_145_cast_fp16, y = linear_87_cast_fp16)[name = tensor("input_149_cast_fp16")]; tensor input_151_axes_0 = const()[name = tensor("input_151_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_14_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(578728064)))]; tensor encoder_layers_14_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_14_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(578730688)))]; tensor input_151_cast_fp16 = layer_norm(axes = input_151_axes_0, beta = encoder_layers_14_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_14_final_layer_norm_weight_to_fp16, x = input_149_cast_fp16)[name = tensor("input_151_cast_fp16")]; tensor encoder_layers_14_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_14_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(578733312)))]; tensor encoder_layers_14_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_14_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(591840576)))]; tensor linear_88_cast_fp16 = linear(bias = encoder_layers_14_fc1_bias_to_fp16, weight = encoder_layers_14_fc1_weight_to_fp16, x = input_151_cast_fp16)[name = tensor("linear_88_cast_fp16")]; tensor input_153_mode_0 = const()[name = tensor("input_153_mode_0"), val = tensor("EXACT")]; tensor input_153_cast_fp16 = gelu(mode = input_153_mode_0, x = linear_88_cast_fp16)[name = tensor("input_153_cast_fp16")]; tensor encoder_layers_14_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_14_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(591850880)))]; tensor encoder_layers_14_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_14_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604958144)))]; tensor linear_89_cast_fp16 = linear(bias = encoder_layers_14_fc2_bias_to_fp16, weight = encoder_layers_14_fc2_weight_to_fp16, x = input_153_cast_fp16)[name = tensor("linear_89_cast_fp16")]; tensor input_155_cast_fp16 = add(x = input_149_cast_fp16, y = linear_89_cast_fp16)[name = tensor("input_155_cast_fp16")]; tensor hidden_states_95_axes_0 = const()[name = tensor("hidden_states_95_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604960768)))]; tensor encoder_layers_15_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604963392)))]; tensor hidden_states_95_cast_fp16 = layer_norm(axes = hidden_states_95_axes_0, beta = encoder_layers_15_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_15_self_attn_layer_norm_weight_to_fp16, x = input_155_cast_fp16)[name = tensor("hidden_states_95_cast_fp16")]; tensor encoder_layers_15_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604966016)))]; tensor encoder_layers_15_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(608242880)))]; tensor linear_90_cast_fp16 = linear(bias = encoder_layers_15_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_15_self_attn_q_proj_weight_to_fp16, x = hidden_states_95_cast_fp16)[name = tensor("linear_90_cast_fp16")]; tensor encoder_layers_15_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(608245504)))]; tensor linear_91_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_15_self_attn_k_proj_weight_to_fp16, x = hidden_states_95_cast_fp16)[name = tensor("linear_91_cast_fp16")]; tensor encoder_layers_15_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(611522368)))]; tensor encoder_layers_15_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614799232)))]; tensor linear_92_cast_fp16 = linear(bias = encoder_layers_15_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_15_self_attn_v_proj_weight_to_fp16, x = hidden_states_95_cast_fp16)[name = tensor("linear_92_cast_fp16")]; tensor var_928 = const()[name = tensor("op_928"), val = tensor([1, 1500, 20, 64])]; tensor var_929_cast_fp16 = reshape(shape = var_928, x = linear_90_cast_fp16)[name = tensor("op_929_cast_fp16")]; tensor var_931 = const()[name = tensor("op_931"), val = tensor([1, 1500, 20, 64])]; tensor var_932_cast_fp16 = reshape(shape = var_931, x = linear_91_cast_fp16)[name = tensor("op_932_cast_fp16")]; tensor var_934 = const()[name = tensor("op_934"), val = tensor([1, 1500, 20, 64])]; tensor var_935_cast_fp16 = reshape(shape = var_934, x = linear_92_cast_fp16)[name = tensor("op_935_cast_fp16")]; tensor value_63_perm_0 = const()[name = tensor("value_63_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_15_cast_fp16 = mul(x = var_929_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_15_cast_fp16")]; tensor matmul_15_transpose_y_0 = const()[name = tensor("matmul_15_transpose_y_0"), val = tensor(true)]; tensor matmul_15_transpose_x_0 = const()[name = tensor("matmul_15_transpose_x_0"), val = tensor(false)]; tensor transpose_158_perm_0 = const()[name = tensor("transpose_158_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_159_perm_0 = const()[name = tensor("transpose_159_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_159 = transpose(perm = transpose_159_perm_0, x = var_932_cast_fp16)[name = tensor("transpose_257")]; tensor transpose_158 = transpose(perm = transpose_158_perm_0, x = mul_15_cast_fp16)[name = tensor("transpose_258")]; tensor matmul_15_cast_fp16 = matmul(transpose_x = matmul_15_transpose_x_0, transpose_y = matmul_15_transpose_y_0, x = transpose_158, y = transpose_159)[name = tensor("matmul_15_cast_fp16")]; tensor softmax_15_axis_0 = const()[name = tensor("softmax_15_axis_0"), val = tensor(-1)]; tensor softmax_15_cast_fp16 = softmax(axis = softmax_15_axis_0, x = matmul_15_cast_fp16)[name = tensor("softmax_15_cast_fp16")]; tensor attn_output_31_transpose_x_0 = const()[name = tensor("attn_output_31_transpose_x_0"), val = tensor(false)]; tensor attn_output_31_transpose_y_0 = const()[name = tensor("attn_output_31_transpose_y_0"), val = tensor(false)]; tensor value_63_cast_fp16 = transpose(perm = value_63_perm_0, x = var_935_cast_fp16)[name = tensor("transpose_259")]; tensor attn_output_31_cast_fp16 = matmul(transpose_x = attn_output_31_transpose_x_0, transpose_y = attn_output_31_transpose_y_0, x = softmax_15_cast_fp16, y = value_63_cast_fp16)[name = tensor("attn_output_31_cast_fp16")]; tensor var_938_perm_0 = const()[name = tensor("op_938_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_940 = const()[name = tensor("op_940"), val = tensor([1, 1500, 1280])]; tensor var_938_cast_fp16 = transpose(perm = var_938_perm_0, x = attn_output_31_cast_fp16)[name = tensor("transpose_256")]; tensor input_157_cast_fp16 = reshape(shape = var_940, x = var_938_cast_fp16)[name = tensor("input_157_cast_fp16")]; tensor encoder_layers_15_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614801856)))]; tensor encoder_layers_15_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(618078720)))]; tensor linear_93_cast_fp16 = linear(bias = encoder_layers_15_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_15_self_attn_out_proj_weight_to_fp16, x = input_157_cast_fp16)[name = tensor("linear_93_cast_fp16")]; tensor input_159_cast_fp16 = add(x = input_155_cast_fp16, y = linear_93_cast_fp16)[name = tensor("input_159_cast_fp16")]; tensor input_161_axes_0 = const()[name = tensor("input_161_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_15_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(618081344)))]; tensor encoder_layers_15_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_15_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(618083968)))]; tensor input_161_cast_fp16 = layer_norm(axes = input_161_axes_0, beta = encoder_layers_15_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_15_final_layer_norm_weight_to_fp16, x = input_159_cast_fp16)[name = tensor("input_161_cast_fp16")]; tensor encoder_layers_15_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_15_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(618086592)))]; tensor encoder_layers_15_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_15_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(631193856)))]; tensor linear_94_cast_fp16 = linear(bias = encoder_layers_15_fc1_bias_to_fp16, weight = encoder_layers_15_fc1_weight_to_fp16, x = input_161_cast_fp16)[name = tensor("linear_94_cast_fp16")]; tensor input_163_mode_0 = const()[name = tensor("input_163_mode_0"), val = tensor("EXACT")]; tensor input_163_cast_fp16 = gelu(mode = input_163_mode_0, x = linear_94_cast_fp16)[name = tensor("input_163_cast_fp16")]; tensor encoder_layers_15_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_15_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(631204160)))]; tensor encoder_layers_15_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_15_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644311424)))]; tensor linear_95_cast_fp16 = linear(bias = encoder_layers_15_fc2_bias_to_fp16, weight = encoder_layers_15_fc2_weight_to_fp16, x = input_163_cast_fp16)[name = tensor("linear_95_cast_fp16")]; tensor input_165_cast_fp16 = add(x = input_159_cast_fp16, y = linear_95_cast_fp16)[name = tensor("input_165_cast_fp16")]; tensor hidden_states_101_axes_0 = const()[name = tensor("hidden_states_101_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644314048)))]; tensor encoder_layers_16_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644316672)))]; tensor hidden_states_101_cast_fp16 = layer_norm(axes = hidden_states_101_axes_0, beta = encoder_layers_16_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_16_self_attn_layer_norm_weight_to_fp16, x = input_165_cast_fp16)[name = tensor("hidden_states_101_cast_fp16")]; tensor encoder_layers_16_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644319296)))]; tensor encoder_layers_16_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(647596160)))]; tensor linear_96_cast_fp16 = linear(bias = encoder_layers_16_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_16_self_attn_q_proj_weight_to_fp16, x = hidden_states_101_cast_fp16)[name = tensor("linear_96_cast_fp16")]; tensor encoder_layers_16_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(647598784)))]; tensor linear_97_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_16_self_attn_k_proj_weight_to_fp16, x = hidden_states_101_cast_fp16)[name = tensor("linear_97_cast_fp16")]; tensor encoder_layers_16_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(650875648)))]; tensor encoder_layers_16_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(654152512)))]; tensor linear_98_cast_fp16 = linear(bias = encoder_layers_16_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_16_self_attn_v_proj_weight_to_fp16, x = hidden_states_101_cast_fp16)[name = tensor("linear_98_cast_fp16")]; tensor var_981 = const()[name = tensor("op_981"), val = tensor([1, 1500, 20, 64])]; tensor var_982_cast_fp16 = reshape(shape = var_981, x = linear_96_cast_fp16)[name = tensor("op_982_cast_fp16")]; tensor var_984 = const()[name = tensor("op_984"), val = tensor([1, 1500, 20, 64])]; tensor var_985_cast_fp16 = reshape(shape = var_984, x = linear_97_cast_fp16)[name = tensor("op_985_cast_fp16")]; tensor var_987 = const()[name = tensor("op_987"), val = tensor([1, 1500, 20, 64])]; tensor var_988_cast_fp16 = reshape(shape = var_987, x = linear_98_cast_fp16)[name = tensor("op_988_cast_fp16")]; tensor value_67_perm_0 = const()[name = tensor("value_67_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_16_cast_fp16 = mul(x = var_982_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_16_cast_fp16")]; tensor matmul_16_transpose_y_0 = const()[name = tensor("matmul_16_transpose_y_0"), val = tensor(true)]; tensor matmul_16_transpose_x_0 = const()[name = tensor("matmul_16_transpose_x_0"), val = tensor(false)]; tensor transpose_160_perm_0 = const()[name = tensor("transpose_160_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_161_perm_0 = const()[name = tensor("transpose_161_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_161 = transpose(perm = transpose_161_perm_0, x = var_985_cast_fp16)[name = tensor("transpose_253")]; tensor transpose_160 = transpose(perm = transpose_160_perm_0, x = mul_16_cast_fp16)[name = tensor("transpose_254")]; tensor matmul_16_cast_fp16 = matmul(transpose_x = matmul_16_transpose_x_0, transpose_y = matmul_16_transpose_y_0, x = transpose_160, y = transpose_161)[name = tensor("matmul_16_cast_fp16")]; tensor softmax_16_axis_0 = const()[name = tensor("softmax_16_axis_0"), val = tensor(-1)]; tensor softmax_16_cast_fp16 = softmax(axis = softmax_16_axis_0, x = matmul_16_cast_fp16)[name = tensor("softmax_16_cast_fp16")]; tensor attn_output_33_transpose_x_0 = const()[name = tensor("attn_output_33_transpose_x_0"), val = tensor(false)]; tensor attn_output_33_transpose_y_0 = const()[name = tensor("attn_output_33_transpose_y_0"), val = tensor(false)]; tensor value_67_cast_fp16 = transpose(perm = value_67_perm_0, x = var_988_cast_fp16)[name = tensor("transpose_255")]; tensor attn_output_33_cast_fp16 = matmul(transpose_x = attn_output_33_transpose_x_0, transpose_y = attn_output_33_transpose_y_0, x = softmax_16_cast_fp16, y = value_67_cast_fp16)[name = tensor("attn_output_33_cast_fp16")]; tensor var_991_perm_0 = const()[name = tensor("op_991_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_993 = const()[name = tensor("op_993"), val = tensor([1, 1500, 1280])]; tensor var_991_cast_fp16 = transpose(perm = var_991_perm_0, x = attn_output_33_cast_fp16)[name = tensor("transpose_252")]; tensor input_167_cast_fp16 = reshape(shape = var_993, x = var_991_cast_fp16)[name = tensor("input_167_cast_fp16")]; tensor encoder_layers_16_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(654155136)))]; tensor encoder_layers_16_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(657432000)))]; tensor linear_99_cast_fp16 = linear(bias = encoder_layers_16_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_16_self_attn_out_proj_weight_to_fp16, x = input_167_cast_fp16)[name = tensor("linear_99_cast_fp16")]; tensor input_169_cast_fp16 = add(x = input_165_cast_fp16, y = linear_99_cast_fp16)[name = tensor("input_169_cast_fp16")]; tensor input_171_axes_0 = const()[name = tensor("input_171_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_16_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(657434624)))]; tensor encoder_layers_16_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_16_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(657437248)))]; tensor input_171_cast_fp16 = layer_norm(axes = input_171_axes_0, beta = encoder_layers_16_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_16_final_layer_norm_weight_to_fp16, x = input_169_cast_fp16)[name = tensor("input_171_cast_fp16")]; tensor encoder_layers_16_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_16_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(657439872)))]; tensor encoder_layers_16_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_16_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(670547136)))]; tensor linear_100_cast_fp16 = linear(bias = encoder_layers_16_fc1_bias_to_fp16, weight = encoder_layers_16_fc1_weight_to_fp16, x = input_171_cast_fp16)[name = tensor("linear_100_cast_fp16")]; tensor input_173_mode_0 = const()[name = tensor("input_173_mode_0"), val = tensor("EXACT")]; tensor input_173_cast_fp16 = gelu(mode = input_173_mode_0, x = linear_100_cast_fp16)[name = tensor("input_173_cast_fp16")]; tensor encoder_layers_16_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_16_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(670557440)))]; tensor encoder_layers_16_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_16_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(683664704)))]; tensor linear_101_cast_fp16 = linear(bias = encoder_layers_16_fc2_bias_to_fp16, weight = encoder_layers_16_fc2_weight_to_fp16, x = input_173_cast_fp16)[name = tensor("linear_101_cast_fp16")]; tensor input_175_cast_fp16 = add(x = input_169_cast_fp16, y = linear_101_cast_fp16)[name = tensor("input_175_cast_fp16")]; tensor hidden_states_107_axes_0 = const()[name = tensor("hidden_states_107_axes_0"), val = tensor([-1])]; tensor encoder_layers_17_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(683667328)))]; tensor encoder_layers_17_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(683669952)))]; tensor hidden_states_107_cast_fp16 = layer_norm(axes = hidden_states_107_axes_0, beta = encoder_layers_17_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_17_self_attn_layer_norm_weight_to_fp16, x = input_175_cast_fp16)[name = tensor("hidden_states_107_cast_fp16")]; tensor encoder_layers_17_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(683672576)))]; tensor encoder_layers_17_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(686949440)))]; tensor linear_102_cast_fp16 = linear(bias = encoder_layers_17_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_17_self_attn_q_proj_weight_to_fp16, x = hidden_states_107_cast_fp16)[name = tensor("linear_102_cast_fp16")]; tensor encoder_layers_17_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(686952064)))]; tensor linear_103_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_17_self_attn_k_proj_weight_to_fp16, x = hidden_states_107_cast_fp16)[name = tensor("linear_103_cast_fp16")]; tensor encoder_layers_17_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(690228928)))]; tensor encoder_layers_17_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(693505792)))]; tensor linear_104_cast_fp16 = linear(bias = encoder_layers_17_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_17_self_attn_v_proj_weight_to_fp16, x = hidden_states_107_cast_fp16)[name = tensor("linear_104_cast_fp16")]; tensor var_1034 = const()[name = tensor("op_1034"), val = tensor([1, 1500, 20, 64])]; tensor var_1035_cast_fp16 = reshape(shape = var_1034, x = linear_102_cast_fp16)[name = tensor("op_1035_cast_fp16")]; tensor var_1037 = const()[name = tensor("op_1037"), val = tensor([1, 1500, 20, 64])]; tensor var_1038_cast_fp16 = reshape(shape = var_1037, x = linear_103_cast_fp16)[name = tensor("op_1038_cast_fp16")]; tensor var_1040 = const()[name = tensor("op_1040"), val = tensor([1, 1500, 20, 64])]; tensor var_1041_cast_fp16 = reshape(shape = var_1040, x = linear_104_cast_fp16)[name = tensor("op_1041_cast_fp16")]; tensor value_71_perm_0 = const()[name = tensor("value_71_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_17_cast_fp16 = mul(x = var_1035_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_17_cast_fp16")]; tensor matmul_17_transpose_y_0 = const()[name = tensor("matmul_17_transpose_y_0"), val = tensor(true)]; tensor matmul_17_transpose_x_0 = const()[name = tensor("matmul_17_transpose_x_0"), val = tensor(false)]; tensor transpose_162_perm_0 = const()[name = tensor("transpose_162_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_163_perm_0 = const()[name = tensor("transpose_163_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_163 = transpose(perm = transpose_163_perm_0, x = var_1038_cast_fp16)[name = tensor("transpose_249")]; tensor transpose_162 = transpose(perm = transpose_162_perm_0, x = mul_17_cast_fp16)[name = tensor("transpose_250")]; tensor matmul_17_cast_fp16 = matmul(transpose_x = matmul_17_transpose_x_0, transpose_y = matmul_17_transpose_y_0, x = transpose_162, y = transpose_163)[name = tensor("matmul_17_cast_fp16")]; tensor softmax_17_axis_0 = const()[name = tensor("softmax_17_axis_0"), val = tensor(-1)]; tensor softmax_17_cast_fp16 = softmax(axis = softmax_17_axis_0, x = matmul_17_cast_fp16)[name = tensor("softmax_17_cast_fp16")]; tensor attn_output_35_transpose_x_0 = const()[name = tensor("attn_output_35_transpose_x_0"), val = tensor(false)]; tensor attn_output_35_transpose_y_0 = const()[name = tensor("attn_output_35_transpose_y_0"), val = tensor(false)]; tensor value_71_cast_fp16 = transpose(perm = value_71_perm_0, x = var_1041_cast_fp16)[name = tensor("transpose_251")]; tensor attn_output_35_cast_fp16 = matmul(transpose_x = attn_output_35_transpose_x_0, transpose_y = attn_output_35_transpose_y_0, x = softmax_17_cast_fp16, y = value_71_cast_fp16)[name = tensor("attn_output_35_cast_fp16")]; tensor var_1044_perm_0 = const()[name = tensor("op_1044_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1046 = const()[name = tensor("op_1046"), val = tensor([1, 1500, 1280])]; tensor var_1044_cast_fp16 = transpose(perm = var_1044_perm_0, x = attn_output_35_cast_fp16)[name = tensor("transpose_248")]; tensor input_177_cast_fp16 = reshape(shape = var_1046, x = var_1044_cast_fp16)[name = tensor("input_177_cast_fp16")]; tensor encoder_layers_17_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(693508416)))]; tensor encoder_layers_17_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_17_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(696785280)))]; tensor linear_105_cast_fp16 = linear(bias = encoder_layers_17_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_17_self_attn_out_proj_weight_to_fp16, x = input_177_cast_fp16)[name = tensor("linear_105_cast_fp16")]; tensor input_179_cast_fp16 = add(x = input_175_cast_fp16, y = linear_105_cast_fp16)[name = tensor("input_179_cast_fp16")]; tensor input_181_axes_0 = const()[name = tensor("input_181_axes_0"), val = tensor([-1])]; tensor encoder_layers_17_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_17_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(696787904)))]; tensor encoder_layers_17_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_17_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(696790528)))]; tensor input_181_cast_fp16 = layer_norm(axes = input_181_axes_0, beta = encoder_layers_17_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_17_final_layer_norm_weight_to_fp16, x = input_179_cast_fp16)[name = tensor("input_181_cast_fp16")]; tensor encoder_layers_17_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_17_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(696793152)))]; tensor encoder_layers_17_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_17_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(709900416)))]; tensor linear_106_cast_fp16 = linear(bias = encoder_layers_17_fc1_bias_to_fp16, weight = encoder_layers_17_fc1_weight_to_fp16, x = input_181_cast_fp16)[name = tensor("linear_106_cast_fp16")]; tensor input_183_mode_0 = const()[name = tensor("input_183_mode_0"), val = tensor("EXACT")]; tensor input_183_cast_fp16 = gelu(mode = input_183_mode_0, x = linear_106_cast_fp16)[name = tensor("input_183_cast_fp16")]; tensor encoder_layers_17_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_17_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(709910720)))]; tensor encoder_layers_17_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_17_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(723017984)))]; tensor linear_107_cast_fp16 = linear(bias = encoder_layers_17_fc2_bias_to_fp16, weight = encoder_layers_17_fc2_weight_to_fp16, x = input_183_cast_fp16)[name = tensor("linear_107_cast_fp16")]; tensor input_185_cast_fp16 = add(x = input_179_cast_fp16, y = linear_107_cast_fp16)[name = tensor("input_185_cast_fp16")]; tensor hidden_states_113_axes_0 = const()[name = tensor("hidden_states_113_axes_0"), val = tensor([-1])]; tensor encoder_layers_18_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(723020608)))]; tensor encoder_layers_18_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(723023232)))]; tensor hidden_states_113_cast_fp16 = layer_norm(axes = hidden_states_113_axes_0, beta = encoder_layers_18_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_18_self_attn_layer_norm_weight_to_fp16, x = input_185_cast_fp16)[name = tensor("hidden_states_113_cast_fp16")]; tensor encoder_layers_18_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(723025856)))]; tensor encoder_layers_18_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(726302720)))]; tensor linear_108_cast_fp16 = linear(bias = encoder_layers_18_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_18_self_attn_q_proj_weight_to_fp16, x = hidden_states_113_cast_fp16)[name = tensor("linear_108_cast_fp16")]; tensor encoder_layers_18_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(726305344)))]; tensor linear_109_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_18_self_attn_k_proj_weight_to_fp16, x = hidden_states_113_cast_fp16)[name = tensor("linear_109_cast_fp16")]; tensor encoder_layers_18_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(729582208)))]; tensor encoder_layers_18_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(732859072)))]; tensor linear_110_cast_fp16 = linear(bias = encoder_layers_18_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_18_self_attn_v_proj_weight_to_fp16, x = hidden_states_113_cast_fp16)[name = tensor("linear_110_cast_fp16")]; tensor var_1087 = const()[name = tensor("op_1087"), val = tensor([1, 1500, 20, 64])]; tensor var_1088_cast_fp16 = reshape(shape = var_1087, x = linear_108_cast_fp16)[name = tensor("op_1088_cast_fp16")]; tensor var_1090 = const()[name = tensor("op_1090"), val = tensor([1, 1500, 20, 64])]; tensor var_1091_cast_fp16 = reshape(shape = var_1090, x = linear_109_cast_fp16)[name = tensor("op_1091_cast_fp16")]; tensor var_1093 = const()[name = tensor("op_1093"), val = tensor([1, 1500, 20, 64])]; tensor var_1094_cast_fp16 = reshape(shape = var_1093, x = linear_110_cast_fp16)[name = tensor("op_1094_cast_fp16")]; tensor value_75_perm_0 = const()[name = tensor("value_75_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_18_cast_fp16 = mul(x = var_1088_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_18_cast_fp16")]; tensor matmul_18_transpose_y_0 = const()[name = tensor("matmul_18_transpose_y_0"), val = tensor(true)]; tensor matmul_18_transpose_x_0 = const()[name = tensor("matmul_18_transpose_x_0"), val = tensor(false)]; tensor transpose_164_perm_0 = const()[name = tensor("transpose_164_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_165_perm_0 = const()[name = tensor("transpose_165_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_165 = transpose(perm = transpose_165_perm_0, x = var_1091_cast_fp16)[name = tensor("transpose_245")]; tensor transpose_164 = transpose(perm = transpose_164_perm_0, x = mul_18_cast_fp16)[name = tensor("transpose_246")]; tensor matmul_18_cast_fp16 = matmul(transpose_x = matmul_18_transpose_x_0, transpose_y = matmul_18_transpose_y_0, x = transpose_164, y = transpose_165)[name = tensor("matmul_18_cast_fp16")]; tensor softmax_18_axis_0 = const()[name = tensor("softmax_18_axis_0"), val = tensor(-1)]; tensor softmax_18_cast_fp16 = softmax(axis = softmax_18_axis_0, x = matmul_18_cast_fp16)[name = tensor("softmax_18_cast_fp16")]; tensor attn_output_37_transpose_x_0 = const()[name = tensor("attn_output_37_transpose_x_0"), val = tensor(false)]; tensor attn_output_37_transpose_y_0 = const()[name = tensor("attn_output_37_transpose_y_0"), val = tensor(false)]; tensor value_75_cast_fp16 = transpose(perm = value_75_perm_0, x = var_1094_cast_fp16)[name = tensor("transpose_247")]; tensor attn_output_37_cast_fp16 = matmul(transpose_x = attn_output_37_transpose_x_0, transpose_y = attn_output_37_transpose_y_0, x = softmax_18_cast_fp16, y = value_75_cast_fp16)[name = tensor("attn_output_37_cast_fp16")]; tensor var_1097_perm_0 = const()[name = tensor("op_1097_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1099 = const()[name = tensor("op_1099"), val = tensor([1, 1500, 1280])]; tensor var_1097_cast_fp16 = transpose(perm = var_1097_perm_0, x = attn_output_37_cast_fp16)[name = tensor("transpose_244")]; tensor input_187_cast_fp16 = reshape(shape = var_1099, x = var_1097_cast_fp16)[name = tensor("input_187_cast_fp16")]; tensor encoder_layers_18_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(732861696)))]; tensor encoder_layers_18_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_18_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736138560)))]; tensor linear_111_cast_fp16 = linear(bias = encoder_layers_18_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_18_self_attn_out_proj_weight_to_fp16, x = input_187_cast_fp16)[name = tensor("linear_111_cast_fp16")]; tensor input_189_cast_fp16 = add(x = input_185_cast_fp16, y = linear_111_cast_fp16)[name = tensor("input_189_cast_fp16")]; tensor input_191_axes_0 = const()[name = tensor("input_191_axes_0"), val = tensor([-1])]; tensor encoder_layers_18_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_18_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736141184)))]; tensor encoder_layers_18_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_18_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736143808)))]; tensor input_191_cast_fp16 = layer_norm(axes = input_191_axes_0, beta = encoder_layers_18_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_18_final_layer_norm_weight_to_fp16, x = input_189_cast_fp16)[name = tensor("input_191_cast_fp16")]; tensor encoder_layers_18_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_18_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736146432)))]; tensor encoder_layers_18_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_18_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(749253696)))]; tensor linear_112_cast_fp16 = linear(bias = encoder_layers_18_fc1_bias_to_fp16, weight = encoder_layers_18_fc1_weight_to_fp16, x = input_191_cast_fp16)[name = tensor("linear_112_cast_fp16")]; tensor input_193_mode_0 = const()[name = tensor("input_193_mode_0"), val = tensor("EXACT")]; tensor input_193_cast_fp16 = gelu(mode = input_193_mode_0, x = linear_112_cast_fp16)[name = tensor("input_193_cast_fp16")]; tensor encoder_layers_18_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_18_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(749264000)))]; tensor encoder_layers_18_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_18_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762371264)))]; tensor linear_113_cast_fp16 = linear(bias = encoder_layers_18_fc2_bias_to_fp16, weight = encoder_layers_18_fc2_weight_to_fp16, x = input_193_cast_fp16)[name = tensor("linear_113_cast_fp16")]; tensor input_195_cast_fp16 = add(x = input_189_cast_fp16, y = linear_113_cast_fp16)[name = tensor("input_195_cast_fp16")]; tensor hidden_states_119_axes_0 = const()[name = tensor("hidden_states_119_axes_0"), val = tensor([-1])]; tensor encoder_layers_19_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762373888)))]; tensor encoder_layers_19_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762376512)))]; tensor hidden_states_119_cast_fp16 = layer_norm(axes = hidden_states_119_axes_0, beta = encoder_layers_19_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_19_self_attn_layer_norm_weight_to_fp16, x = input_195_cast_fp16)[name = tensor("hidden_states_119_cast_fp16")]; tensor encoder_layers_19_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762379136)))]; tensor encoder_layers_19_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765656000)))]; tensor linear_114_cast_fp16 = linear(bias = encoder_layers_19_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_19_self_attn_q_proj_weight_to_fp16, x = hidden_states_119_cast_fp16)[name = tensor("linear_114_cast_fp16")]; tensor encoder_layers_19_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765658624)))]; tensor linear_115_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_19_self_attn_k_proj_weight_to_fp16, x = hidden_states_119_cast_fp16)[name = tensor("linear_115_cast_fp16")]; tensor encoder_layers_19_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(768935488)))]; tensor encoder_layers_19_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(772212352)))]; tensor linear_116_cast_fp16 = linear(bias = encoder_layers_19_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_19_self_attn_v_proj_weight_to_fp16, x = hidden_states_119_cast_fp16)[name = tensor("linear_116_cast_fp16")]; tensor var_1140 = const()[name = tensor("op_1140"), val = tensor([1, 1500, 20, 64])]; tensor var_1141_cast_fp16 = reshape(shape = var_1140, x = linear_114_cast_fp16)[name = tensor("op_1141_cast_fp16")]; tensor var_1143 = const()[name = tensor("op_1143"), val = tensor([1, 1500, 20, 64])]; tensor var_1144_cast_fp16 = reshape(shape = var_1143, x = linear_115_cast_fp16)[name = tensor("op_1144_cast_fp16")]; tensor var_1146 = const()[name = tensor("op_1146"), val = tensor([1, 1500, 20, 64])]; tensor var_1147_cast_fp16 = reshape(shape = var_1146, x = linear_116_cast_fp16)[name = tensor("op_1147_cast_fp16")]; tensor value_79_perm_0 = const()[name = tensor("value_79_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_19_cast_fp16 = mul(x = var_1141_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_19_cast_fp16")]; tensor matmul_19_transpose_y_0 = const()[name = tensor("matmul_19_transpose_y_0"), val = tensor(true)]; tensor matmul_19_transpose_x_0 = const()[name = tensor("matmul_19_transpose_x_0"), val = tensor(false)]; tensor transpose_166_perm_0 = const()[name = tensor("transpose_166_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_167_perm_0 = const()[name = tensor("transpose_167_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_167 = transpose(perm = transpose_167_perm_0, x = var_1144_cast_fp16)[name = tensor("transpose_241")]; tensor transpose_166 = transpose(perm = transpose_166_perm_0, x = mul_19_cast_fp16)[name = tensor("transpose_242")]; tensor matmul_19_cast_fp16 = matmul(transpose_x = matmul_19_transpose_x_0, transpose_y = matmul_19_transpose_y_0, x = transpose_166, y = transpose_167)[name = tensor("matmul_19_cast_fp16")]; tensor softmax_19_axis_0 = const()[name = tensor("softmax_19_axis_0"), val = tensor(-1)]; tensor softmax_19_cast_fp16 = softmax(axis = softmax_19_axis_0, x = matmul_19_cast_fp16)[name = tensor("softmax_19_cast_fp16")]; tensor attn_output_39_transpose_x_0 = const()[name = tensor("attn_output_39_transpose_x_0"), val = tensor(false)]; tensor attn_output_39_transpose_y_0 = const()[name = tensor("attn_output_39_transpose_y_0"), val = tensor(false)]; tensor value_79_cast_fp16 = transpose(perm = value_79_perm_0, x = var_1147_cast_fp16)[name = tensor("transpose_243")]; tensor attn_output_39_cast_fp16 = matmul(transpose_x = attn_output_39_transpose_x_0, transpose_y = attn_output_39_transpose_y_0, x = softmax_19_cast_fp16, y = value_79_cast_fp16)[name = tensor("attn_output_39_cast_fp16")]; tensor var_1150_perm_0 = const()[name = tensor("op_1150_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1152 = const()[name = tensor("op_1152"), val = tensor([1, 1500, 1280])]; tensor var_1150_cast_fp16 = transpose(perm = var_1150_perm_0, x = attn_output_39_cast_fp16)[name = tensor("transpose_240")]; tensor input_197_cast_fp16 = reshape(shape = var_1152, x = var_1150_cast_fp16)[name = tensor("input_197_cast_fp16")]; tensor encoder_layers_19_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(772214976)))]; tensor encoder_layers_19_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_19_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(775491840)))]; tensor linear_117_cast_fp16 = linear(bias = encoder_layers_19_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_19_self_attn_out_proj_weight_to_fp16, x = input_197_cast_fp16)[name = tensor("linear_117_cast_fp16")]; tensor input_199_cast_fp16 = add(x = input_195_cast_fp16, y = linear_117_cast_fp16)[name = tensor("input_199_cast_fp16")]; tensor input_201_axes_0 = const()[name = tensor("input_201_axes_0"), val = tensor([-1])]; tensor encoder_layers_19_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_19_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(775494464)))]; tensor encoder_layers_19_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_19_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(775497088)))]; tensor input_201_cast_fp16 = layer_norm(axes = input_201_axes_0, beta = encoder_layers_19_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_19_final_layer_norm_weight_to_fp16, x = input_199_cast_fp16)[name = tensor("input_201_cast_fp16")]; tensor encoder_layers_19_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_19_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(775499712)))]; tensor encoder_layers_19_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_19_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(788606976)))]; tensor linear_118_cast_fp16 = linear(bias = encoder_layers_19_fc1_bias_to_fp16, weight = encoder_layers_19_fc1_weight_to_fp16, x = input_201_cast_fp16)[name = tensor("linear_118_cast_fp16")]; tensor input_203_mode_0 = const()[name = tensor("input_203_mode_0"), val = tensor("EXACT")]; tensor input_203_cast_fp16 = gelu(mode = input_203_mode_0, x = linear_118_cast_fp16)[name = tensor("input_203_cast_fp16")]; tensor encoder_layers_19_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_19_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(788617280)))]; tensor encoder_layers_19_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_19_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801724544)))]; tensor linear_119_cast_fp16 = linear(bias = encoder_layers_19_fc2_bias_to_fp16, weight = encoder_layers_19_fc2_weight_to_fp16, x = input_203_cast_fp16)[name = tensor("linear_119_cast_fp16")]; tensor input_205_cast_fp16 = add(x = input_199_cast_fp16, y = linear_119_cast_fp16)[name = tensor("input_205_cast_fp16")]; tensor hidden_states_125_axes_0 = const()[name = tensor("hidden_states_125_axes_0"), val = tensor([-1])]; tensor encoder_layers_20_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801727168)))]; tensor encoder_layers_20_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801729792)))]; tensor hidden_states_125_cast_fp16 = layer_norm(axes = hidden_states_125_axes_0, beta = encoder_layers_20_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_20_self_attn_layer_norm_weight_to_fp16, x = input_205_cast_fp16)[name = tensor("hidden_states_125_cast_fp16")]; tensor encoder_layers_20_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801732416)))]; tensor encoder_layers_20_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(805009280)))]; tensor linear_120_cast_fp16 = linear(bias = encoder_layers_20_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_20_self_attn_q_proj_weight_to_fp16, x = hidden_states_125_cast_fp16)[name = tensor("linear_120_cast_fp16")]; tensor encoder_layers_20_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(805011904)))]; tensor linear_121_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_20_self_attn_k_proj_weight_to_fp16, x = hidden_states_125_cast_fp16)[name = tensor("linear_121_cast_fp16")]; tensor encoder_layers_20_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(808288768)))]; tensor encoder_layers_20_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(811565632)))]; tensor linear_122_cast_fp16 = linear(bias = encoder_layers_20_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_20_self_attn_v_proj_weight_to_fp16, x = hidden_states_125_cast_fp16)[name = tensor("linear_122_cast_fp16")]; tensor var_1193 = const()[name = tensor("op_1193"), val = tensor([1, 1500, 20, 64])]; tensor var_1194_cast_fp16 = reshape(shape = var_1193, x = linear_120_cast_fp16)[name = tensor("op_1194_cast_fp16")]; tensor var_1196 = const()[name = tensor("op_1196"), val = tensor([1, 1500, 20, 64])]; tensor var_1197_cast_fp16 = reshape(shape = var_1196, x = linear_121_cast_fp16)[name = tensor("op_1197_cast_fp16")]; tensor var_1199 = const()[name = tensor("op_1199"), val = tensor([1, 1500, 20, 64])]; tensor var_1200_cast_fp16 = reshape(shape = var_1199, x = linear_122_cast_fp16)[name = tensor("op_1200_cast_fp16")]; tensor value_83_perm_0 = const()[name = tensor("value_83_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_20_cast_fp16 = mul(x = var_1194_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_20_cast_fp16")]; tensor matmul_20_transpose_y_0 = const()[name = tensor("matmul_20_transpose_y_0"), val = tensor(true)]; tensor matmul_20_transpose_x_0 = const()[name = tensor("matmul_20_transpose_x_0"), val = tensor(false)]; tensor transpose_168_perm_0 = const()[name = tensor("transpose_168_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_169_perm_0 = const()[name = tensor("transpose_169_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_169 = transpose(perm = transpose_169_perm_0, x = var_1197_cast_fp16)[name = tensor("transpose_237")]; tensor transpose_168 = transpose(perm = transpose_168_perm_0, x = mul_20_cast_fp16)[name = tensor("transpose_238")]; tensor matmul_20_cast_fp16 = matmul(transpose_x = matmul_20_transpose_x_0, transpose_y = matmul_20_transpose_y_0, x = transpose_168, y = transpose_169)[name = tensor("matmul_20_cast_fp16")]; tensor softmax_20_axis_0 = const()[name = tensor("softmax_20_axis_0"), val = tensor(-1)]; tensor softmax_20_cast_fp16 = softmax(axis = softmax_20_axis_0, x = matmul_20_cast_fp16)[name = tensor("softmax_20_cast_fp16")]; tensor attn_output_41_transpose_x_0 = const()[name = tensor("attn_output_41_transpose_x_0"), val = tensor(false)]; tensor attn_output_41_transpose_y_0 = const()[name = tensor("attn_output_41_transpose_y_0"), val = tensor(false)]; tensor value_83_cast_fp16 = transpose(perm = value_83_perm_0, x = var_1200_cast_fp16)[name = tensor("transpose_239")]; tensor attn_output_41_cast_fp16 = matmul(transpose_x = attn_output_41_transpose_x_0, transpose_y = attn_output_41_transpose_y_0, x = softmax_20_cast_fp16, y = value_83_cast_fp16)[name = tensor("attn_output_41_cast_fp16")]; tensor var_1203_perm_0 = const()[name = tensor("op_1203_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1205 = const()[name = tensor("op_1205"), val = tensor([1, 1500, 1280])]; tensor var_1203_cast_fp16 = transpose(perm = var_1203_perm_0, x = attn_output_41_cast_fp16)[name = tensor("transpose_236")]; tensor input_207_cast_fp16 = reshape(shape = var_1205, x = var_1203_cast_fp16)[name = tensor("input_207_cast_fp16")]; tensor encoder_layers_20_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(811568256)))]; tensor encoder_layers_20_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_20_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(814845120)))]; tensor linear_123_cast_fp16 = linear(bias = encoder_layers_20_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_20_self_attn_out_proj_weight_to_fp16, x = input_207_cast_fp16)[name = tensor("linear_123_cast_fp16")]; tensor input_209_cast_fp16 = add(x = input_205_cast_fp16, y = linear_123_cast_fp16)[name = tensor("input_209_cast_fp16")]; tensor input_211_axes_0 = const()[name = tensor("input_211_axes_0"), val = tensor([-1])]; tensor encoder_layers_20_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_20_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(814847744)))]; tensor encoder_layers_20_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_20_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(814850368)))]; tensor input_211_cast_fp16 = layer_norm(axes = input_211_axes_0, beta = encoder_layers_20_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_20_final_layer_norm_weight_to_fp16, x = input_209_cast_fp16)[name = tensor("input_211_cast_fp16")]; tensor encoder_layers_20_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_20_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(814852992)))]; tensor encoder_layers_20_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_20_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(827960256)))]; tensor linear_124_cast_fp16 = linear(bias = encoder_layers_20_fc1_bias_to_fp16, weight = encoder_layers_20_fc1_weight_to_fp16, x = input_211_cast_fp16)[name = tensor("linear_124_cast_fp16")]; tensor input_213_mode_0 = const()[name = tensor("input_213_mode_0"), val = tensor("EXACT")]; tensor input_213_cast_fp16 = gelu(mode = input_213_mode_0, x = linear_124_cast_fp16)[name = tensor("input_213_cast_fp16")]; tensor encoder_layers_20_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_20_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(827970560)))]; tensor encoder_layers_20_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_20_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(841077824)))]; tensor linear_125_cast_fp16 = linear(bias = encoder_layers_20_fc2_bias_to_fp16, weight = encoder_layers_20_fc2_weight_to_fp16, x = input_213_cast_fp16)[name = tensor("linear_125_cast_fp16")]; tensor input_215_cast_fp16 = add(x = input_209_cast_fp16, y = linear_125_cast_fp16)[name = tensor("input_215_cast_fp16")]; tensor hidden_states_131_axes_0 = const()[name = tensor("hidden_states_131_axes_0"), val = tensor([-1])]; tensor encoder_layers_21_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(841080448)))]; tensor encoder_layers_21_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(841083072)))]; tensor hidden_states_131_cast_fp16 = layer_norm(axes = hidden_states_131_axes_0, beta = encoder_layers_21_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_21_self_attn_layer_norm_weight_to_fp16, x = input_215_cast_fp16)[name = tensor("hidden_states_131_cast_fp16")]; tensor encoder_layers_21_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(841085696)))]; tensor encoder_layers_21_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(844362560)))]; tensor linear_126_cast_fp16 = linear(bias = encoder_layers_21_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_21_self_attn_q_proj_weight_to_fp16, x = hidden_states_131_cast_fp16)[name = tensor("linear_126_cast_fp16")]; tensor encoder_layers_21_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(844365184)))]; tensor linear_127_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_21_self_attn_k_proj_weight_to_fp16, x = hidden_states_131_cast_fp16)[name = tensor("linear_127_cast_fp16")]; tensor encoder_layers_21_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(847642048)))]; tensor encoder_layers_21_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(850918912)))]; tensor linear_128_cast_fp16 = linear(bias = encoder_layers_21_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_21_self_attn_v_proj_weight_to_fp16, x = hidden_states_131_cast_fp16)[name = tensor("linear_128_cast_fp16")]; tensor var_1246 = const()[name = tensor("op_1246"), val = tensor([1, 1500, 20, 64])]; tensor var_1247_cast_fp16 = reshape(shape = var_1246, x = linear_126_cast_fp16)[name = tensor("op_1247_cast_fp16")]; tensor var_1249 = const()[name = tensor("op_1249"), val = tensor([1, 1500, 20, 64])]; tensor var_1250_cast_fp16 = reshape(shape = var_1249, x = linear_127_cast_fp16)[name = tensor("op_1250_cast_fp16")]; tensor var_1252 = const()[name = tensor("op_1252"), val = tensor([1, 1500, 20, 64])]; tensor var_1253_cast_fp16 = reshape(shape = var_1252, x = linear_128_cast_fp16)[name = tensor("op_1253_cast_fp16")]; tensor value_87_perm_0 = const()[name = tensor("value_87_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_21_cast_fp16 = mul(x = var_1247_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_21_cast_fp16")]; tensor matmul_21_transpose_y_0 = const()[name = tensor("matmul_21_transpose_y_0"), val = tensor(true)]; tensor matmul_21_transpose_x_0 = const()[name = tensor("matmul_21_transpose_x_0"), val = tensor(false)]; tensor transpose_170_perm_0 = const()[name = tensor("transpose_170_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_171_perm_0 = const()[name = tensor("transpose_171_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_171 = transpose(perm = transpose_171_perm_0, x = var_1250_cast_fp16)[name = tensor("transpose_233")]; tensor transpose_170 = transpose(perm = transpose_170_perm_0, x = mul_21_cast_fp16)[name = tensor("transpose_234")]; tensor matmul_21_cast_fp16 = matmul(transpose_x = matmul_21_transpose_x_0, transpose_y = matmul_21_transpose_y_0, x = transpose_170, y = transpose_171)[name = tensor("matmul_21_cast_fp16")]; tensor softmax_21_axis_0 = const()[name = tensor("softmax_21_axis_0"), val = tensor(-1)]; tensor softmax_21_cast_fp16 = softmax(axis = softmax_21_axis_0, x = matmul_21_cast_fp16)[name = tensor("softmax_21_cast_fp16")]; tensor attn_output_43_transpose_x_0 = const()[name = tensor("attn_output_43_transpose_x_0"), val = tensor(false)]; tensor attn_output_43_transpose_y_0 = const()[name = tensor("attn_output_43_transpose_y_0"), val = tensor(false)]; tensor value_87_cast_fp16 = transpose(perm = value_87_perm_0, x = var_1253_cast_fp16)[name = tensor("transpose_235")]; tensor attn_output_43_cast_fp16 = matmul(transpose_x = attn_output_43_transpose_x_0, transpose_y = attn_output_43_transpose_y_0, x = softmax_21_cast_fp16, y = value_87_cast_fp16)[name = tensor("attn_output_43_cast_fp16")]; tensor var_1256_perm_0 = const()[name = tensor("op_1256_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1258 = const()[name = tensor("op_1258"), val = tensor([1, 1500, 1280])]; tensor var_1256_cast_fp16 = transpose(perm = var_1256_perm_0, x = attn_output_43_cast_fp16)[name = tensor("transpose_232")]; tensor input_217_cast_fp16 = reshape(shape = var_1258, x = var_1256_cast_fp16)[name = tensor("input_217_cast_fp16")]; tensor encoder_layers_21_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(850921536)))]; tensor encoder_layers_21_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_21_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(854198400)))]; tensor linear_129_cast_fp16 = linear(bias = encoder_layers_21_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_21_self_attn_out_proj_weight_to_fp16, x = input_217_cast_fp16)[name = tensor("linear_129_cast_fp16")]; tensor input_219_cast_fp16 = add(x = input_215_cast_fp16, y = linear_129_cast_fp16)[name = tensor("input_219_cast_fp16")]; tensor input_221_axes_0 = const()[name = tensor("input_221_axes_0"), val = tensor([-1])]; tensor encoder_layers_21_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_21_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(854201024)))]; tensor encoder_layers_21_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_21_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(854203648)))]; tensor input_221_cast_fp16 = layer_norm(axes = input_221_axes_0, beta = encoder_layers_21_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_21_final_layer_norm_weight_to_fp16, x = input_219_cast_fp16)[name = tensor("input_221_cast_fp16")]; tensor encoder_layers_21_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_21_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(854206272)))]; tensor encoder_layers_21_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_21_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(867313536)))]; tensor linear_130_cast_fp16 = linear(bias = encoder_layers_21_fc1_bias_to_fp16, weight = encoder_layers_21_fc1_weight_to_fp16, x = input_221_cast_fp16)[name = tensor("linear_130_cast_fp16")]; tensor input_223_mode_0 = const()[name = tensor("input_223_mode_0"), val = tensor("EXACT")]; tensor input_223_cast_fp16 = gelu(mode = input_223_mode_0, x = linear_130_cast_fp16)[name = tensor("input_223_cast_fp16")]; tensor encoder_layers_21_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_21_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(867323840)))]; tensor encoder_layers_21_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_21_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(880431104)))]; tensor linear_131_cast_fp16 = linear(bias = encoder_layers_21_fc2_bias_to_fp16, weight = encoder_layers_21_fc2_weight_to_fp16, x = input_223_cast_fp16)[name = tensor("linear_131_cast_fp16")]; tensor input_225_cast_fp16 = add(x = input_219_cast_fp16, y = linear_131_cast_fp16)[name = tensor("input_225_cast_fp16")]; tensor hidden_states_137_axes_0 = const()[name = tensor("hidden_states_137_axes_0"), val = tensor([-1])]; tensor encoder_layers_22_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(880433728)))]; tensor encoder_layers_22_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(880436352)))]; tensor hidden_states_137_cast_fp16 = layer_norm(axes = hidden_states_137_axes_0, beta = encoder_layers_22_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_22_self_attn_layer_norm_weight_to_fp16, x = input_225_cast_fp16)[name = tensor("hidden_states_137_cast_fp16")]; tensor encoder_layers_22_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(880438976)))]; tensor encoder_layers_22_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(883715840)))]; tensor linear_132_cast_fp16 = linear(bias = encoder_layers_22_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_22_self_attn_q_proj_weight_to_fp16, x = hidden_states_137_cast_fp16)[name = tensor("linear_132_cast_fp16")]; tensor encoder_layers_22_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(883718464)))]; tensor linear_133_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_22_self_attn_k_proj_weight_to_fp16, x = hidden_states_137_cast_fp16)[name = tensor("linear_133_cast_fp16")]; tensor encoder_layers_22_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(886995328)))]; tensor encoder_layers_22_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(890272192)))]; tensor linear_134_cast_fp16 = linear(bias = encoder_layers_22_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_22_self_attn_v_proj_weight_to_fp16, x = hidden_states_137_cast_fp16)[name = tensor("linear_134_cast_fp16")]; tensor var_1299 = const()[name = tensor("op_1299"), val = tensor([1, 1500, 20, 64])]; tensor var_1300_cast_fp16 = reshape(shape = var_1299, x = linear_132_cast_fp16)[name = tensor("op_1300_cast_fp16")]; tensor var_1302 = const()[name = tensor("op_1302"), val = tensor([1, 1500, 20, 64])]; tensor var_1303_cast_fp16 = reshape(shape = var_1302, x = linear_133_cast_fp16)[name = tensor("op_1303_cast_fp16")]; tensor var_1305 = const()[name = tensor("op_1305"), val = tensor([1, 1500, 20, 64])]; tensor var_1306_cast_fp16 = reshape(shape = var_1305, x = linear_134_cast_fp16)[name = tensor("op_1306_cast_fp16")]; tensor value_91_perm_0 = const()[name = tensor("value_91_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_22_cast_fp16 = mul(x = var_1300_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_22_cast_fp16")]; tensor matmul_22_transpose_y_0 = const()[name = tensor("matmul_22_transpose_y_0"), val = tensor(true)]; tensor matmul_22_transpose_x_0 = const()[name = tensor("matmul_22_transpose_x_0"), val = tensor(false)]; tensor transpose_172_perm_0 = const()[name = tensor("transpose_172_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_173_perm_0 = const()[name = tensor("transpose_173_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_173 = transpose(perm = transpose_173_perm_0, x = var_1303_cast_fp16)[name = tensor("transpose_229")]; tensor transpose_172 = transpose(perm = transpose_172_perm_0, x = mul_22_cast_fp16)[name = tensor("transpose_230")]; tensor matmul_22_cast_fp16 = matmul(transpose_x = matmul_22_transpose_x_0, transpose_y = matmul_22_transpose_y_0, x = transpose_172, y = transpose_173)[name = tensor("matmul_22_cast_fp16")]; tensor softmax_22_axis_0 = const()[name = tensor("softmax_22_axis_0"), val = tensor(-1)]; tensor softmax_22_cast_fp16 = softmax(axis = softmax_22_axis_0, x = matmul_22_cast_fp16)[name = tensor("softmax_22_cast_fp16")]; tensor attn_output_45_transpose_x_0 = const()[name = tensor("attn_output_45_transpose_x_0"), val = tensor(false)]; tensor attn_output_45_transpose_y_0 = const()[name = tensor("attn_output_45_transpose_y_0"), val = tensor(false)]; tensor value_91_cast_fp16 = transpose(perm = value_91_perm_0, x = var_1306_cast_fp16)[name = tensor("transpose_231")]; tensor attn_output_45_cast_fp16 = matmul(transpose_x = attn_output_45_transpose_x_0, transpose_y = attn_output_45_transpose_y_0, x = softmax_22_cast_fp16, y = value_91_cast_fp16)[name = tensor("attn_output_45_cast_fp16")]; tensor var_1309_perm_0 = const()[name = tensor("op_1309_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1311 = const()[name = tensor("op_1311"), val = tensor([1, 1500, 1280])]; tensor var_1309_cast_fp16 = transpose(perm = var_1309_perm_0, x = attn_output_45_cast_fp16)[name = tensor("transpose_228")]; tensor input_227_cast_fp16 = reshape(shape = var_1311, x = var_1309_cast_fp16)[name = tensor("input_227_cast_fp16")]; tensor encoder_layers_22_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(890274816)))]; tensor encoder_layers_22_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_22_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(893551680)))]; tensor linear_135_cast_fp16 = linear(bias = encoder_layers_22_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_22_self_attn_out_proj_weight_to_fp16, x = input_227_cast_fp16)[name = tensor("linear_135_cast_fp16")]; tensor input_229_cast_fp16 = add(x = input_225_cast_fp16, y = linear_135_cast_fp16)[name = tensor("input_229_cast_fp16")]; tensor input_231_axes_0 = const()[name = tensor("input_231_axes_0"), val = tensor([-1])]; tensor encoder_layers_22_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_22_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(893554304)))]; tensor encoder_layers_22_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_22_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(893556928)))]; tensor input_231_cast_fp16 = layer_norm(axes = input_231_axes_0, beta = encoder_layers_22_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_22_final_layer_norm_weight_to_fp16, x = input_229_cast_fp16)[name = tensor("input_231_cast_fp16")]; tensor encoder_layers_22_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_22_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(893559552)))]; tensor encoder_layers_22_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_22_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(906666816)))]; tensor linear_136_cast_fp16 = linear(bias = encoder_layers_22_fc1_bias_to_fp16, weight = encoder_layers_22_fc1_weight_to_fp16, x = input_231_cast_fp16)[name = tensor("linear_136_cast_fp16")]; tensor input_233_mode_0 = const()[name = tensor("input_233_mode_0"), val = tensor("EXACT")]; tensor input_233_cast_fp16 = gelu(mode = input_233_mode_0, x = linear_136_cast_fp16)[name = tensor("input_233_cast_fp16")]; tensor encoder_layers_22_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_22_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(906677120)))]; tensor encoder_layers_22_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_22_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(919784384)))]; tensor linear_137_cast_fp16 = linear(bias = encoder_layers_22_fc2_bias_to_fp16, weight = encoder_layers_22_fc2_weight_to_fp16, x = input_233_cast_fp16)[name = tensor("linear_137_cast_fp16")]; tensor input_235_cast_fp16 = add(x = input_229_cast_fp16, y = linear_137_cast_fp16)[name = tensor("input_235_cast_fp16")]; tensor hidden_states_143_axes_0 = const()[name = tensor("hidden_states_143_axes_0"), val = tensor([-1])]; tensor encoder_layers_23_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(919787008)))]; tensor encoder_layers_23_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(919789632)))]; tensor hidden_states_143_cast_fp16 = layer_norm(axes = hidden_states_143_axes_0, beta = encoder_layers_23_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_23_self_attn_layer_norm_weight_to_fp16, x = input_235_cast_fp16)[name = tensor("hidden_states_143_cast_fp16")]; tensor encoder_layers_23_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(919792256)))]; tensor encoder_layers_23_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(923069120)))]; tensor linear_138_cast_fp16 = linear(bias = encoder_layers_23_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_23_self_attn_q_proj_weight_to_fp16, x = hidden_states_143_cast_fp16)[name = tensor("linear_138_cast_fp16")]; tensor encoder_layers_23_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(923071744)))]; tensor linear_139_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_23_self_attn_k_proj_weight_to_fp16, x = hidden_states_143_cast_fp16)[name = tensor("linear_139_cast_fp16")]; tensor encoder_layers_23_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(926348608)))]; tensor encoder_layers_23_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(929625472)))]; tensor linear_140_cast_fp16 = linear(bias = encoder_layers_23_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_23_self_attn_v_proj_weight_to_fp16, x = hidden_states_143_cast_fp16)[name = tensor("linear_140_cast_fp16")]; tensor var_1352 = const()[name = tensor("op_1352"), val = tensor([1, 1500, 20, 64])]; tensor var_1353_cast_fp16 = reshape(shape = var_1352, x = linear_138_cast_fp16)[name = tensor("op_1353_cast_fp16")]; tensor var_1355 = const()[name = tensor("op_1355"), val = tensor([1, 1500, 20, 64])]; tensor var_1356_cast_fp16 = reshape(shape = var_1355, x = linear_139_cast_fp16)[name = tensor("op_1356_cast_fp16")]; tensor var_1358 = const()[name = tensor("op_1358"), val = tensor([1, 1500, 20, 64])]; tensor var_1359_cast_fp16 = reshape(shape = var_1358, x = linear_140_cast_fp16)[name = tensor("op_1359_cast_fp16")]; tensor value_95_perm_0 = const()[name = tensor("value_95_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_23_cast_fp16 = mul(x = var_1353_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_23_cast_fp16")]; tensor matmul_23_transpose_y_0 = const()[name = tensor("matmul_23_transpose_y_0"), val = tensor(true)]; tensor matmul_23_transpose_x_0 = const()[name = tensor("matmul_23_transpose_x_0"), val = tensor(false)]; tensor transpose_174_perm_0 = const()[name = tensor("transpose_174_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_175_perm_0 = const()[name = tensor("transpose_175_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_175 = transpose(perm = transpose_175_perm_0, x = var_1356_cast_fp16)[name = tensor("transpose_225")]; tensor transpose_174 = transpose(perm = transpose_174_perm_0, x = mul_23_cast_fp16)[name = tensor("transpose_226")]; tensor matmul_23_cast_fp16 = matmul(transpose_x = matmul_23_transpose_x_0, transpose_y = matmul_23_transpose_y_0, x = transpose_174, y = transpose_175)[name = tensor("matmul_23_cast_fp16")]; tensor softmax_23_axis_0 = const()[name = tensor("softmax_23_axis_0"), val = tensor(-1)]; tensor softmax_23_cast_fp16 = softmax(axis = softmax_23_axis_0, x = matmul_23_cast_fp16)[name = tensor("softmax_23_cast_fp16")]; tensor attn_output_47_transpose_x_0 = const()[name = tensor("attn_output_47_transpose_x_0"), val = tensor(false)]; tensor attn_output_47_transpose_y_0 = const()[name = tensor("attn_output_47_transpose_y_0"), val = tensor(false)]; tensor value_95_cast_fp16 = transpose(perm = value_95_perm_0, x = var_1359_cast_fp16)[name = tensor("transpose_227")]; tensor attn_output_47_cast_fp16 = matmul(transpose_x = attn_output_47_transpose_x_0, transpose_y = attn_output_47_transpose_y_0, x = softmax_23_cast_fp16, y = value_95_cast_fp16)[name = tensor("attn_output_47_cast_fp16")]; tensor var_1362_perm_0 = const()[name = tensor("op_1362_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1364 = const()[name = tensor("op_1364"), val = tensor([1, 1500, 1280])]; tensor var_1362_cast_fp16 = transpose(perm = var_1362_perm_0, x = attn_output_47_cast_fp16)[name = tensor("transpose_224")]; tensor input_237_cast_fp16 = reshape(shape = var_1364, x = var_1362_cast_fp16)[name = tensor("input_237_cast_fp16")]; tensor encoder_layers_23_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(929628096)))]; tensor encoder_layers_23_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_23_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(932904960)))]; tensor linear_141_cast_fp16 = linear(bias = encoder_layers_23_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_23_self_attn_out_proj_weight_to_fp16, x = input_237_cast_fp16)[name = tensor("linear_141_cast_fp16")]; tensor input_239_cast_fp16 = add(x = input_235_cast_fp16, y = linear_141_cast_fp16)[name = tensor("input_239_cast_fp16")]; tensor input_241_axes_0 = const()[name = tensor("input_241_axes_0"), val = tensor([-1])]; tensor encoder_layers_23_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_23_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(932907584)))]; tensor encoder_layers_23_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_23_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(932910208)))]; tensor input_241_cast_fp16 = layer_norm(axes = input_241_axes_0, beta = encoder_layers_23_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_23_final_layer_norm_weight_to_fp16, x = input_239_cast_fp16)[name = tensor("input_241_cast_fp16")]; tensor encoder_layers_23_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_23_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(932912832)))]; tensor encoder_layers_23_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_23_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(946020096)))]; tensor linear_142_cast_fp16 = linear(bias = encoder_layers_23_fc1_bias_to_fp16, weight = encoder_layers_23_fc1_weight_to_fp16, x = input_241_cast_fp16)[name = tensor("linear_142_cast_fp16")]; tensor input_243_mode_0 = const()[name = tensor("input_243_mode_0"), val = tensor("EXACT")]; tensor input_243_cast_fp16 = gelu(mode = input_243_mode_0, x = linear_142_cast_fp16)[name = tensor("input_243_cast_fp16")]; tensor encoder_layers_23_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_23_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(946030400)))]; tensor encoder_layers_23_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_23_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(959137664)))]; tensor linear_143_cast_fp16 = linear(bias = encoder_layers_23_fc2_bias_to_fp16, weight = encoder_layers_23_fc2_weight_to_fp16, x = input_243_cast_fp16)[name = tensor("linear_143_cast_fp16")]; tensor input_245_cast_fp16 = add(x = input_239_cast_fp16, y = linear_143_cast_fp16)[name = tensor("input_245_cast_fp16")]; tensor hidden_states_149_axes_0 = const()[name = tensor("hidden_states_149_axes_0"), val = tensor([-1])]; tensor encoder_layers_24_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_24_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(959140288)))]; tensor encoder_layers_24_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_24_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(959142912)))]; tensor hidden_states_149_cast_fp16 = layer_norm(axes = hidden_states_149_axes_0, beta = encoder_layers_24_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_24_self_attn_layer_norm_weight_to_fp16, x = input_245_cast_fp16)[name = tensor("hidden_states_149_cast_fp16")]; tensor encoder_layers_24_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_24_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(959145536)))]; tensor encoder_layers_24_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_24_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(962422400)))]; tensor linear_144_cast_fp16 = linear(bias = encoder_layers_24_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_24_self_attn_q_proj_weight_to_fp16, x = hidden_states_149_cast_fp16)[name = tensor("linear_144_cast_fp16")]; tensor encoder_layers_24_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_24_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(962425024)))]; tensor linear_145_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_24_self_attn_k_proj_weight_to_fp16, x = hidden_states_149_cast_fp16)[name = tensor("linear_145_cast_fp16")]; tensor encoder_layers_24_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_24_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(965701888)))]; tensor encoder_layers_24_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_24_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(968978752)))]; tensor linear_146_cast_fp16 = linear(bias = encoder_layers_24_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_24_self_attn_v_proj_weight_to_fp16, x = hidden_states_149_cast_fp16)[name = tensor("linear_146_cast_fp16")]; tensor var_1405 = const()[name = tensor("op_1405"), val = tensor([1, 1500, 20, 64])]; tensor var_1406_cast_fp16 = reshape(shape = var_1405, x = linear_144_cast_fp16)[name = tensor("op_1406_cast_fp16")]; tensor var_1408 = const()[name = tensor("op_1408"), val = tensor([1, 1500, 20, 64])]; tensor var_1409_cast_fp16 = reshape(shape = var_1408, x = linear_145_cast_fp16)[name = tensor("op_1409_cast_fp16")]; tensor var_1411 = const()[name = tensor("op_1411"), val = tensor([1, 1500, 20, 64])]; tensor var_1412_cast_fp16 = reshape(shape = var_1411, x = linear_146_cast_fp16)[name = tensor("op_1412_cast_fp16")]; tensor value_99_perm_0 = const()[name = tensor("value_99_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_24_cast_fp16 = mul(x = var_1406_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_24_cast_fp16")]; tensor matmul_24_transpose_y_0 = const()[name = tensor("matmul_24_transpose_y_0"), val = tensor(true)]; tensor matmul_24_transpose_x_0 = const()[name = tensor("matmul_24_transpose_x_0"), val = tensor(false)]; tensor transpose_176_perm_0 = const()[name = tensor("transpose_176_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_177_perm_0 = const()[name = tensor("transpose_177_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_177 = transpose(perm = transpose_177_perm_0, x = var_1409_cast_fp16)[name = tensor("transpose_221")]; tensor transpose_176 = transpose(perm = transpose_176_perm_0, x = mul_24_cast_fp16)[name = tensor("transpose_222")]; tensor matmul_24_cast_fp16 = matmul(transpose_x = matmul_24_transpose_x_0, transpose_y = matmul_24_transpose_y_0, x = transpose_176, y = transpose_177)[name = tensor("matmul_24_cast_fp16")]; tensor softmax_24_axis_0 = const()[name = tensor("softmax_24_axis_0"), val = tensor(-1)]; tensor softmax_24_cast_fp16 = softmax(axis = softmax_24_axis_0, x = matmul_24_cast_fp16)[name = tensor("softmax_24_cast_fp16")]; tensor attn_output_49_transpose_x_0 = const()[name = tensor("attn_output_49_transpose_x_0"), val = tensor(false)]; tensor attn_output_49_transpose_y_0 = const()[name = tensor("attn_output_49_transpose_y_0"), val = tensor(false)]; tensor value_99_cast_fp16 = transpose(perm = value_99_perm_0, x = var_1412_cast_fp16)[name = tensor("transpose_223")]; tensor attn_output_49_cast_fp16 = matmul(transpose_x = attn_output_49_transpose_x_0, transpose_y = attn_output_49_transpose_y_0, x = softmax_24_cast_fp16, y = value_99_cast_fp16)[name = tensor("attn_output_49_cast_fp16")]; tensor var_1415_perm_0 = const()[name = tensor("op_1415_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1417 = const()[name = tensor("op_1417"), val = tensor([1, 1500, 1280])]; tensor var_1415_cast_fp16 = transpose(perm = var_1415_perm_0, x = attn_output_49_cast_fp16)[name = tensor("transpose_220")]; tensor input_247_cast_fp16 = reshape(shape = var_1417, x = var_1415_cast_fp16)[name = tensor("input_247_cast_fp16")]; tensor encoder_layers_24_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_24_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(968981376)))]; tensor encoder_layers_24_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_24_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(972258240)))]; tensor linear_147_cast_fp16 = linear(bias = encoder_layers_24_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_24_self_attn_out_proj_weight_to_fp16, x = input_247_cast_fp16)[name = tensor("linear_147_cast_fp16")]; tensor input_249_cast_fp16 = add(x = input_245_cast_fp16, y = linear_147_cast_fp16)[name = tensor("input_249_cast_fp16")]; tensor input_251_axes_0 = const()[name = tensor("input_251_axes_0"), val = tensor([-1])]; tensor encoder_layers_24_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_24_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(972260864)))]; tensor encoder_layers_24_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_24_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(972263488)))]; tensor input_251_cast_fp16 = layer_norm(axes = input_251_axes_0, beta = encoder_layers_24_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_24_final_layer_norm_weight_to_fp16, x = input_249_cast_fp16)[name = tensor("input_251_cast_fp16")]; tensor encoder_layers_24_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_24_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(972266112)))]; tensor encoder_layers_24_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_24_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(985373376)))]; tensor linear_148_cast_fp16 = linear(bias = encoder_layers_24_fc1_bias_to_fp16, weight = encoder_layers_24_fc1_weight_to_fp16, x = input_251_cast_fp16)[name = tensor("linear_148_cast_fp16")]; tensor input_253_mode_0 = const()[name = tensor("input_253_mode_0"), val = tensor("EXACT")]; tensor input_253_cast_fp16 = gelu(mode = input_253_mode_0, x = linear_148_cast_fp16)[name = tensor("input_253_cast_fp16")]; tensor encoder_layers_24_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_24_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(985383680)))]; tensor encoder_layers_24_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_24_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(998490944)))]; tensor linear_149_cast_fp16 = linear(bias = encoder_layers_24_fc2_bias_to_fp16, weight = encoder_layers_24_fc2_weight_to_fp16, x = input_253_cast_fp16)[name = tensor("linear_149_cast_fp16")]; tensor input_255_cast_fp16 = add(x = input_249_cast_fp16, y = linear_149_cast_fp16)[name = tensor("input_255_cast_fp16")]; tensor hidden_states_155_axes_0 = const()[name = tensor("hidden_states_155_axes_0"), val = tensor([-1])]; tensor encoder_layers_25_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_25_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(998493568)))]; tensor encoder_layers_25_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_25_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(998496192)))]; tensor hidden_states_155_cast_fp16 = layer_norm(axes = hidden_states_155_axes_0, beta = encoder_layers_25_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_25_self_attn_layer_norm_weight_to_fp16, x = input_255_cast_fp16)[name = tensor("hidden_states_155_cast_fp16")]; tensor encoder_layers_25_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_25_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(998498816)))]; tensor encoder_layers_25_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_25_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1001775680)))]; tensor linear_150_cast_fp16 = linear(bias = encoder_layers_25_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_25_self_attn_q_proj_weight_to_fp16, x = hidden_states_155_cast_fp16)[name = tensor("linear_150_cast_fp16")]; tensor encoder_layers_25_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_25_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1001778304)))]; tensor linear_151_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_25_self_attn_k_proj_weight_to_fp16, x = hidden_states_155_cast_fp16)[name = tensor("linear_151_cast_fp16")]; tensor encoder_layers_25_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_25_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1005055168)))]; tensor encoder_layers_25_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_25_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1008332032)))]; tensor linear_152_cast_fp16 = linear(bias = encoder_layers_25_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_25_self_attn_v_proj_weight_to_fp16, x = hidden_states_155_cast_fp16)[name = tensor("linear_152_cast_fp16")]; tensor var_1458 = const()[name = tensor("op_1458"), val = tensor([1, 1500, 20, 64])]; tensor var_1459_cast_fp16 = reshape(shape = var_1458, x = linear_150_cast_fp16)[name = tensor("op_1459_cast_fp16")]; tensor var_1461 = const()[name = tensor("op_1461"), val = tensor([1, 1500, 20, 64])]; tensor var_1462_cast_fp16 = reshape(shape = var_1461, x = linear_151_cast_fp16)[name = tensor("op_1462_cast_fp16")]; tensor var_1464 = const()[name = tensor("op_1464"), val = tensor([1, 1500, 20, 64])]; tensor var_1465_cast_fp16 = reshape(shape = var_1464, x = linear_152_cast_fp16)[name = tensor("op_1465_cast_fp16")]; tensor value_103_perm_0 = const()[name = tensor("value_103_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_25_cast_fp16 = mul(x = var_1459_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_25_cast_fp16")]; tensor matmul_25_transpose_y_0 = const()[name = tensor("matmul_25_transpose_y_0"), val = tensor(true)]; tensor matmul_25_transpose_x_0 = const()[name = tensor("matmul_25_transpose_x_0"), val = tensor(false)]; tensor transpose_178_perm_0 = const()[name = tensor("transpose_178_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_179_perm_0 = const()[name = tensor("transpose_179_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_179 = transpose(perm = transpose_179_perm_0, x = var_1462_cast_fp16)[name = tensor("transpose_217")]; tensor transpose_178 = transpose(perm = transpose_178_perm_0, x = mul_25_cast_fp16)[name = tensor("transpose_218")]; tensor matmul_25_cast_fp16 = matmul(transpose_x = matmul_25_transpose_x_0, transpose_y = matmul_25_transpose_y_0, x = transpose_178, y = transpose_179)[name = tensor("matmul_25_cast_fp16")]; tensor softmax_25_axis_0 = const()[name = tensor("softmax_25_axis_0"), val = tensor(-1)]; tensor softmax_25_cast_fp16 = softmax(axis = softmax_25_axis_0, x = matmul_25_cast_fp16)[name = tensor("softmax_25_cast_fp16")]; tensor attn_output_51_transpose_x_0 = const()[name = tensor("attn_output_51_transpose_x_0"), val = tensor(false)]; tensor attn_output_51_transpose_y_0 = const()[name = tensor("attn_output_51_transpose_y_0"), val = tensor(false)]; tensor value_103_cast_fp16 = transpose(perm = value_103_perm_0, x = var_1465_cast_fp16)[name = tensor("transpose_219")]; tensor attn_output_51_cast_fp16 = matmul(transpose_x = attn_output_51_transpose_x_0, transpose_y = attn_output_51_transpose_y_0, x = softmax_25_cast_fp16, y = value_103_cast_fp16)[name = tensor("attn_output_51_cast_fp16")]; tensor var_1468_perm_0 = const()[name = tensor("op_1468_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1470 = const()[name = tensor("op_1470"), val = tensor([1, 1500, 1280])]; tensor var_1468_cast_fp16 = transpose(perm = var_1468_perm_0, x = attn_output_51_cast_fp16)[name = tensor("transpose_216")]; tensor input_257_cast_fp16 = reshape(shape = var_1470, x = var_1468_cast_fp16)[name = tensor("input_257_cast_fp16")]; tensor encoder_layers_25_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_25_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1008334656)))]; tensor encoder_layers_25_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_25_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1011611520)))]; tensor linear_153_cast_fp16 = linear(bias = encoder_layers_25_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_25_self_attn_out_proj_weight_to_fp16, x = input_257_cast_fp16)[name = tensor("linear_153_cast_fp16")]; tensor input_259_cast_fp16 = add(x = input_255_cast_fp16, y = linear_153_cast_fp16)[name = tensor("input_259_cast_fp16")]; tensor input_261_axes_0 = const()[name = tensor("input_261_axes_0"), val = tensor([-1])]; tensor encoder_layers_25_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_25_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1011614144)))]; tensor encoder_layers_25_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_25_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1011616768)))]; tensor input_261_cast_fp16 = layer_norm(axes = input_261_axes_0, beta = encoder_layers_25_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_25_final_layer_norm_weight_to_fp16, x = input_259_cast_fp16)[name = tensor("input_261_cast_fp16")]; tensor encoder_layers_25_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_25_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1011619392)))]; tensor encoder_layers_25_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_25_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1024726656)))]; tensor linear_154_cast_fp16 = linear(bias = encoder_layers_25_fc1_bias_to_fp16, weight = encoder_layers_25_fc1_weight_to_fp16, x = input_261_cast_fp16)[name = tensor("linear_154_cast_fp16")]; tensor input_263_mode_0 = const()[name = tensor("input_263_mode_0"), val = tensor("EXACT")]; tensor input_263_cast_fp16 = gelu(mode = input_263_mode_0, x = linear_154_cast_fp16)[name = tensor("input_263_cast_fp16")]; tensor encoder_layers_25_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_25_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1024736960)))]; tensor encoder_layers_25_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_25_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1037844224)))]; tensor linear_155_cast_fp16 = linear(bias = encoder_layers_25_fc2_bias_to_fp16, weight = encoder_layers_25_fc2_weight_to_fp16, x = input_263_cast_fp16)[name = tensor("linear_155_cast_fp16")]; tensor input_265_cast_fp16 = add(x = input_259_cast_fp16, y = linear_155_cast_fp16)[name = tensor("input_265_cast_fp16")]; tensor hidden_states_161_axes_0 = const()[name = tensor("hidden_states_161_axes_0"), val = tensor([-1])]; tensor encoder_layers_26_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_26_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1037846848)))]; tensor encoder_layers_26_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_26_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1037849472)))]; tensor hidden_states_161_cast_fp16 = layer_norm(axes = hidden_states_161_axes_0, beta = encoder_layers_26_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_26_self_attn_layer_norm_weight_to_fp16, x = input_265_cast_fp16)[name = tensor("hidden_states_161_cast_fp16")]; tensor encoder_layers_26_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_26_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1037852096)))]; tensor encoder_layers_26_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_26_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1041128960)))]; tensor linear_156_cast_fp16 = linear(bias = encoder_layers_26_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_26_self_attn_q_proj_weight_to_fp16, x = hidden_states_161_cast_fp16)[name = tensor("linear_156_cast_fp16")]; tensor encoder_layers_26_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_26_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1041131584)))]; tensor linear_157_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_26_self_attn_k_proj_weight_to_fp16, x = hidden_states_161_cast_fp16)[name = tensor("linear_157_cast_fp16")]; tensor encoder_layers_26_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_26_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1044408448)))]; tensor encoder_layers_26_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_26_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1047685312)))]; tensor linear_158_cast_fp16 = linear(bias = encoder_layers_26_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_26_self_attn_v_proj_weight_to_fp16, x = hidden_states_161_cast_fp16)[name = tensor("linear_158_cast_fp16")]; tensor var_1511 = const()[name = tensor("op_1511"), val = tensor([1, 1500, 20, 64])]; tensor var_1512_cast_fp16 = reshape(shape = var_1511, x = linear_156_cast_fp16)[name = tensor("op_1512_cast_fp16")]; tensor var_1514 = const()[name = tensor("op_1514"), val = tensor([1, 1500, 20, 64])]; tensor var_1515_cast_fp16 = reshape(shape = var_1514, x = linear_157_cast_fp16)[name = tensor("op_1515_cast_fp16")]; tensor var_1517 = const()[name = tensor("op_1517"), val = tensor([1, 1500, 20, 64])]; tensor var_1518_cast_fp16 = reshape(shape = var_1517, x = linear_158_cast_fp16)[name = tensor("op_1518_cast_fp16")]; tensor value_107_perm_0 = const()[name = tensor("value_107_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_26_cast_fp16 = mul(x = var_1512_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_26_cast_fp16")]; tensor matmul_26_transpose_y_0 = const()[name = tensor("matmul_26_transpose_y_0"), val = tensor(true)]; tensor matmul_26_transpose_x_0 = const()[name = tensor("matmul_26_transpose_x_0"), val = tensor(false)]; tensor transpose_180_perm_0 = const()[name = tensor("transpose_180_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_181_perm_0 = const()[name = tensor("transpose_181_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_181 = transpose(perm = transpose_181_perm_0, x = var_1515_cast_fp16)[name = tensor("transpose_213")]; tensor transpose_180 = transpose(perm = transpose_180_perm_0, x = mul_26_cast_fp16)[name = tensor("transpose_214")]; tensor matmul_26_cast_fp16 = matmul(transpose_x = matmul_26_transpose_x_0, transpose_y = matmul_26_transpose_y_0, x = transpose_180, y = transpose_181)[name = tensor("matmul_26_cast_fp16")]; tensor softmax_26_axis_0 = const()[name = tensor("softmax_26_axis_0"), val = tensor(-1)]; tensor softmax_26_cast_fp16 = softmax(axis = softmax_26_axis_0, x = matmul_26_cast_fp16)[name = tensor("softmax_26_cast_fp16")]; tensor attn_output_53_transpose_x_0 = const()[name = tensor("attn_output_53_transpose_x_0"), val = tensor(false)]; tensor attn_output_53_transpose_y_0 = const()[name = tensor("attn_output_53_transpose_y_0"), val = tensor(false)]; tensor value_107_cast_fp16 = transpose(perm = value_107_perm_0, x = var_1518_cast_fp16)[name = tensor("transpose_215")]; tensor attn_output_53_cast_fp16 = matmul(transpose_x = attn_output_53_transpose_x_0, transpose_y = attn_output_53_transpose_y_0, x = softmax_26_cast_fp16, y = value_107_cast_fp16)[name = tensor("attn_output_53_cast_fp16")]; tensor var_1521_perm_0 = const()[name = tensor("op_1521_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1523 = const()[name = tensor("op_1523"), val = tensor([1, 1500, 1280])]; tensor var_1521_cast_fp16 = transpose(perm = var_1521_perm_0, x = attn_output_53_cast_fp16)[name = tensor("transpose_212")]; tensor input_267_cast_fp16 = reshape(shape = var_1523, x = var_1521_cast_fp16)[name = tensor("input_267_cast_fp16")]; tensor encoder_layers_26_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_26_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1047687936)))]; tensor encoder_layers_26_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_26_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050964800)))]; tensor linear_159_cast_fp16 = linear(bias = encoder_layers_26_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_26_self_attn_out_proj_weight_to_fp16, x = input_267_cast_fp16)[name = tensor("linear_159_cast_fp16")]; tensor input_269_cast_fp16 = add(x = input_265_cast_fp16, y = linear_159_cast_fp16)[name = tensor("input_269_cast_fp16")]; tensor input_271_axes_0 = const()[name = tensor("input_271_axes_0"), val = tensor([-1])]; tensor encoder_layers_26_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_26_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050967424)))]; tensor encoder_layers_26_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_26_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050970048)))]; tensor input_271_cast_fp16 = layer_norm(axes = input_271_axes_0, beta = encoder_layers_26_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_26_final_layer_norm_weight_to_fp16, x = input_269_cast_fp16)[name = tensor("input_271_cast_fp16")]; tensor encoder_layers_26_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_26_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050972672)))]; tensor encoder_layers_26_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_26_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1064079936)))]; tensor linear_160_cast_fp16 = linear(bias = encoder_layers_26_fc1_bias_to_fp16, weight = encoder_layers_26_fc1_weight_to_fp16, x = input_271_cast_fp16)[name = tensor("linear_160_cast_fp16")]; tensor input_273_mode_0 = const()[name = tensor("input_273_mode_0"), val = tensor("EXACT")]; tensor input_273_cast_fp16 = gelu(mode = input_273_mode_0, x = linear_160_cast_fp16)[name = tensor("input_273_cast_fp16")]; tensor encoder_layers_26_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_26_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1064090240)))]; tensor encoder_layers_26_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_26_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1077197504)))]; tensor linear_161_cast_fp16 = linear(bias = encoder_layers_26_fc2_bias_to_fp16, weight = encoder_layers_26_fc2_weight_to_fp16, x = input_273_cast_fp16)[name = tensor("linear_161_cast_fp16")]; tensor input_275_cast_fp16 = add(x = input_269_cast_fp16, y = linear_161_cast_fp16)[name = tensor("input_275_cast_fp16")]; tensor hidden_states_167_axes_0 = const()[name = tensor("hidden_states_167_axes_0"), val = tensor([-1])]; tensor encoder_layers_27_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_27_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1077200128)))]; tensor encoder_layers_27_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_27_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1077202752)))]; tensor hidden_states_167_cast_fp16 = layer_norm(axes = hidden_states_167_axes_0, beta = encoder_layers_27_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_27_self_attn_layer_norm_weight_to_fp16, x = input_275_cast_fp16)[name = tensor("hidden_states_167_cast_fp16")]; tensor encoder_layers_27_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_27_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1077205376)))]; tensor encoder_layers_27_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_27_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1080482240)))]; tensor linear_162_cast_fp16 = linear(bias = encoder_layers_27_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_27_self_attn_q_proj_weight_to_fp16, x = hidden_states_167_cast_fp16)[name = tensor("linear_162_cast_fp16")]; tensor encoder_layers_27_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_27_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1080484864)))]; tensor linear_163_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_27_self_attn_k_proj_weight_to_fp16, x = hidden_states_167_cast_fp16)[name = tensor("linear_163_cast_fp16")]; tensor encoder_layers_27_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_27_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1083761728)))]; tensor encoder_layers_27_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_27_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1087038592)))]; tensor linear_164_cast_fp16 = linear(bias = encoder_layers_27_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_27_self_attn_v_proj_weight_to_fp16, x = hidden_states_167_cast_fp16)[name = tensor("linear_164_cast_fp16")]; tensor var_1564 = const()[name = tensor("op_1564"), val = tensor([1, 1500, 20, 64])]; tensor var_1565_cast_fp16 = reshape(shape = var_1564, x = linear_162_cast_fp16)[name = tensor("op_1565_cast_fp16")]; tensor var_1567 = const()[name = tensor("op_1567"), val = tensor([1, 1500, 20, 64])]; tensor var_1568_cast_fp16 = reshape(shape = var_1567, x = linear_163_cast_fp16)[name = tensor("op_1568_cast_fp16")]; tensor var_1570 = const()[name = tensor("op_1570"), val = tensor([1, 1500, 20, 64])]; tensor var_1571_cast_fp16 = reshape(shape = var_1570, x = linear_164_cast_fp16)[name = tensor("op_1571_cast_fp16")]; tensor value_111_perm_0 = const()[name = tensor("value_111_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_27_cast_fp16 = mul(x = var_1565_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_27_cast_fp16")]; tensor matmul_27_transpose_y_0 = const()[name = tensor("matmul_27_transpose_y_0"), val = tensor(true)]; tensor matmul_27_transpose_x_0 = const()[name = tensor("matmul_27_transpose_x_0"), val = tensor(false)]; tensor transpose_182_perm_0 = const()[name = tensor("transpose_182_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_183_perm_0 = const()[name = tensor("transpose_183_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_183 = transpose(perm = transpose_183_perm_0, x = var_1568_cast_fp16)[name = tensor("transpose_209")]; tensor transpose_182 = transpose(perm = transpose_182_perm_0, x = mul_27_cast_fp16)[name = tensor("transpose_210")]; tensor matmul_27_cast_fp16 = matmul(transpose_x = matmul_27_transpose_x_0, transpose_y = matmul_27_transpose_y_0, x = transpose_182, y = transpose_183)[name = tensor("matmul_27_cast_fp16")]; tensor softmax_27_axis_0 = const()[name = tensor("softmax_27_axis_0"), val = tensor(-1)]; tensor softmax_27_cast_fp16 = softmax(axis = softmax_27_axis_0, x = matmul_27_cast_fp16)[name = tensor("softmax_27_cast_fp16")]; tensor attn_output_55_transpose_x_0 = const()[name = tensor("attn_output_55_transpose_x_0"), val = tensor(false)]; tensor attn_output_55_transpose_y_0 = const()[name = tensor("attn_output_55_transpose_y_0"), val = tensor(false)]; tensor value_111_cast_fp16 = transpose(perm = value_111_perm_0, x = var_1571_cast_fp16)[name = tensor("transpose_211")]; tensor attn_output_55_cast_fp16 = matmul(transpose_x = attn_output_55_transpose_x_0, transpose_y = attn_output_55_transpose_y_0, x = softmax_27_cast_fp16, y = value_111_cast_fp16)[name = tensor("attn_output_55_cast_fp16")]; tensor var_1574_perm_0 = const()[name = tensor("op_1574_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1576 = const()[name = tensor("op_1576"), val = tensor([1, 1500, 1280])]; tensor var_1574_cast_fp16 = transpose(perm = var_1574_perm_0, x = attn_output_55_cast_fp16)[name = tensor("transpose_208")]; tensor input_277_cast_fp16 = reshape(shape = var_1576, x = var_1574_cast_fp16)[name = tensor("input_277_cast_fp16")]; tensor encoder_layers_27_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_27_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1087041216)))]; tensor encoder_layers_27_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_27_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090318080)))]; tensor linear_165_cast_fp16 = linear(bias = encoder_layers_27_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_27_self_attn_out_proj_weight_to_fp16, x = input_277_cast_fp16)[name = tensor("linear_165_cast_fp16")]; tensor input_279_cast_fp16 = add(x = input_275_cast_fp16, y = linear_165_cast_fp16)[name = tensor("input_279_cast_fp16")]; tensor input_281_axes_0 = const()[name = tensor("input_281_axes_0"), val = tensor([-1])]; tensor encoder_layers_27_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_27_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090320704)))]; tensor encoder_layers_27_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_27_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090323328)))]; tensor input_281_cast_fp16 = layer_norm(axes = input_281_axes_0, beta = encoder_layers_27_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_27_final_layer_norm_weight_to_fp16, x = input_279_cast_fp16)[name = tensor("input_281_cast_fp16")]; tensor encoder_layers_27_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_27_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090325952)))]; tensor encoder_layers_27_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_27_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1103433216)))]; tensor linear_166_cast_fp16 = linear(bias = encoder_layers_27_fc1_bias_to_fp16, weight = encoder_layers_27_fc1_weight_to_fp16, x = input_281_cast_fp16)[name = tensor("linear_166_cast_fp16")]; tensor input_283_mode_0 = const()[name = tensor("input_283_mode_0"), val = tensor("EXACT")]; tensor input_283_cast_fp16 = gelu(mode = input_283_mode_0, x = linear_166_cast_fp16)[name = tensor("input_283_cast_fp16")]; tensor encoder_layers_27_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_27_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1103443520)))]; tensor encoder_layers_27_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_27_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1116550784)))]; tensor linear_167_cast_fp16 = linear(bias = encoder_layers_27_fc2_bias_to_fp16, weight = encoder_layers_27_fc2_weight_to_fp16, x = input_283_cast_fp16)[name = tensor("linear_167_cast_fp16")]; tensor input_285_cast_fp16 = add(x = input_279_cast_fp16, y = linear_167_cast_fp16)[name = tensor("input_285_cast_fp16")]; tensor hidden_states_173_axes_0 = const()[name = tensor("hidden_states_173_axes_0"), val = tensor([-1])]; tensor encoder_layers_28_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_28_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1116553408)))]; tensor encoder_layers_28_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_28_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1116556032)))]; tensor hidden_states_173_cast_fp16 = layer_norm(axes = hidden_states_173_axes_0, beta = encoder_layers_28_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_28_self_attn_layer_norm_weight_to_fp16, x = input_285_cast_fp16)[name = tensor("hidden_states_173_cast_fp16")]; tensor encoder_layers_28_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_28_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1116558656)))]; tensor encoder_layers_28_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_28_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1119835520)))]; tensor linear_168_cast_fp16 = linear(bias = encoder_layers_28_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_28_self_attn_q_proj_weight_to_fp16, x = hidden_states_173_cast_fp16)[name = tensor("linear_168_cast_fp16")]; tensor encoder_layers_28_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_28_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1119838144)))]; tensor linear_169_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_28_self_attn_k_proj_weight_to_fp16, x = hidden_states_173_cast_fp16)[name = tensor("linear_169_cast_fp16")]; tensor encoder_layers_28_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_28_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1123115008)))]; tensor encoder_layers_28_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_28_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1126391872)))]; tensor linear_170_cast_fp16 = linear(bias = encoder_layers_28_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_28_self_attn_v_proj_weight_to_fp16, x = hidden_states_173_cast_fp16)[name = tensor("linear_170_cast_fp16")]; tensor var_1617 = const()[name = tensor("op_1617"), val = tensor([1, 1500, 20, 64])]; tensor var_1618_cast_fp16 = reshape(shape = var_1617, x = linear_168_cast_fp16)[name = tensor("op_1618_cast_fp16")]; tensor var_1620 = const()[name = tensor("op_1620"), val = tensor([1, 1500, 20, 64])]; tensor var_1621_cast_fp16 = reshape(shape = var_1620, x = linear_169_cast_fp16)[name = tensor("op_1621_cast_fp16")]; tensor var_1623 = const()[name = tensor("op_1623"), val = tensor([1, 1500, 20, 64])]; tensor var_1624_cast_fp16 = reshape(shape = var_1623, x = linear_170_cast_fp16)[name = tensor("op_1624_cast_fp16")]; tensor value_115_perm_0 = const()[name = tensor("value_115_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_28_cast_fp16 = mul(x = var_1618_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_28_cast_fp16")]; tensor matmul_28_transpose_y_0 = const()[name = tensor("matmul_28_transpose_y_0"), val = tensor(true)]; tensor matmul_28_transpose_x_0 = const()[name = tensor("matmul_28_transpose_x_0"), val = tensor(false)]; tensor transpose_184_perm_0 = const()[name = tensor("transpose_184_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_185_perm_0 = const()[name = tensor("transpose_185_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_185 = transpose(perm = transpose_185_perm_0, x = var_1621_cast_fp16)[name = tensor("transpose_205")]; tensor transpose_184 = transpose(perm = transpose_184_perm_0, x = mul_28_cast_fp16)[name = tensor("transpose_206")]; tensor matmul_28_cast_fp16 = matmul(transpose_x = matmul_28_transpose_x_0, transpose_y = matmul_28_transpose_y_0, x = transpose_184, y = transpose_185)[name = tensor("matmul_28_cast_fp16")]; tensor softmax_28_axis_0 = const()[name = tensor("softmax_28_axis_0"), val = tensor(-1)]; tensor softmax_28_cast_fp16 = softmax(axis = softmax_28_axis_0, x = matmul_28_cast_fp16)[name = tensor("softmax_28_cast_fp16")]; tensor attn_output_57_transpose_x_0 = const()[name = tensor("attn_output_57_transpose_x_0"), val = tensor(false)]; tensor attn_output_57_transpose_y_0 = const()[name = tensor("attn_output_57_transpose_y_0"), val = tensor(false)]; tensor value_115_cast_fp16 = transpose(perm = value_115_perm_0, x = var_1624_cast_fp16)[name = tensor("transpose_207")]; tensor attn_output_57_cast_fp16 = matmul(transpose_x = attn_output_57_transpose_x_0, transpose_y = attn_output_57_transpose_y_0, x = softmax_28_cast_fp16, y = value_115_cast_fp16)[name = tensor("attn_output_57_cast_fp16")]; tensor var_1627_perm_0 = const()[name = tensor("op_1627_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1629 = const()[name = tensor("op_1629"), val = tensor([1, 1500, 1280])]; tensor var_1627_cast_fp16 = transpose(perm = var_1627_perm_0, x = attn_output_57_cast_fp16)[name = tensor("transpose_204")]; tensor input_287_cast_fp16 = reshape(shape = var_1629, x = var_1627_cast_fp16)[name = tensor("input_287_cast_fp16")]; tensor encoder_layers_28_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_28_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1126394496)))]; tensor encoder_layers_28_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_28_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1129671360)))]; tensor linear_171_cast_fp16 = linear(bias = encoder_layers_28_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_28_self_attn_out_proj_weight_to_fp16, x = input_287_cast_fp16)[name = tensor("linear_171_cast_fp16")]; tensor input_289_cast_fp16 = add(x = input_285_cast_fp16, y = linear_171_cast_fp16)[name = tensor("input_289_cast_fp16")]; tensor input_291_axes_0 = const()[name = tensor("input_291_axes_0"), val = tensor([-1])]; tensor encoder_layers_28_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_28_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1129673984)))]; tensor encoder_layers_28_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_28_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1129676608)))]; tensor input_291_cast_fp16 = layer_norm(axes = input_291_axes_0, beta = encoder_layers_28_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_28_final_layer_norm_weight_to_fp16, x = input_289_cast_fp16)[name = tensor("input_291_cast_fp16")]; tensor encoder_layers_28_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_28_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1129679232)))]; tensor encoder_layers_28_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_28_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1142786496)))]; tensor linear_172_cast_fp16 = linear(bias = encoder_layers_28_fc1_bias_to_fp16, weight = encoder_layers_28_fc1_weight_to_fp16, x = input_291_cast_fp16)[name = tensor("linear_172_cast_fp16")]; tensor input_293_mode_0 = const()[name = tensor("input_293_mode_0"), val = tensor("EXACT")]; tensor input_293_cast_fp16 = gelu(mode = input_293_mode_0, x = linear_172_cast_fp16)[name = tensor("input_293_cast_fp16")]; tensor encoder_layers_28_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_28_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1142796800)))]; tensor encoder_layers_28_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_28_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1155904064)))]; tensor linear_173_cast_fp16 = linear(bias = encoder_layers_28_fc2_bias_to_fp16, weight = encoder_layers_28_fc2_weight_to_fp16, x = input_293_cast_fp16)[name = tensor("linear_173_cast_fp16")]; tensor input_295_cast_fp16 = add(x = input_289_cast_fp16, y = linear_173_cast_fp16)[name = tensor("input_295_cast_fp16")]; tensor hidden_states_179_axes_0 = const()[name = tensor("hidden_states_179_axes_0"), val = tensor([-1])]; tensor encoder_layers_29_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_29_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1155906688)))]; tensor encoder_layers_29_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_29_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1155909312)))]; tensor hidden_states_179_cast_fp16 = layer_norm(axes = hidden_states_179_axes_0, beta = encoder_layers_29_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_29_self_attn_layer_norm_weight_to_fp16, x = input_295_cast_fp16)[name = tensor("hidden_states_179_cast_fp16")]; tensor encoder_layers_29_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_29_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1155911936)))]; tensor encoder_layers_29_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_29_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1159188800)))]; tensor linear_174_cast_fp16 = linear(bias = encoder_layers_29_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_29_self_attn_q_proj_weight_to_fp16, x = hidden_states_179_cast_fp16)[name = tensor("linear_174_cast_fp16")]; tensor encoder_layers_29_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_29_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1159191424)))]; tensor linear_175_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_29_self_attn_k_proj_weight_to_fp16, x = hidden_states_179_cast_fp16)[name = tensor("linear_175_cast_fp16")]; tensor encoder_layers_29_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_29_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1162468288)))]; tensor encoder_layers_29_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_29_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1165745152)))]; tensor linear_176_cast_fp16 = linear(bias = encoder_layers_29_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_29_self_attn_v_proj_weight_to_fp16, x = hidden_states_179_cast_fp16)[name = tensor("linear_176_cast_fp16")]; tensor var_1670 = const()[name = tensor("op_1670"), val = tensor([1, 1500, 20, 64])]; tensor var_1671_cast_fp16 = reshape(shape = var_1670, x = linear_174_cast_fp16)[name = tensor("op_1671_cast_fp16")]; tensor var_1673 = const()[name = tensor("op_1673"), val = tensor([1, 1500, 20, 64])]; tensor var_1674_cast_fp16 = reshape(shape = var_1673, x = linear_175_cast_fp16)[name = tensor("op_1674_cast_fp16")]; tensor var_1676 = const()[name = tensor("op_1676"), val = tensor([1, 1500, 20, 64])]; tensor var_1677_cast_fp16 = reshape(shape = var_1676, x = linear_176_cast_fp16)[name = tensor("op_1677_cast_fp16")]; tensor value_119_perm_0 = const()[name = tensor("value_119_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_29_cast_fp16 = mul(x = var_1671_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_29_cast_fp16")]; tensor matmul_29_transpose_y_0 = const()[name = tensor("matmul_29_transpose_y_0"), val = tensor(true)]; tensor matmul_29_transpose_x_0 = const()[name = tensor("matmul_29_transpose_x_0"), val = tensor(false)]; tensor transpose_186_perm_0 = const()[name = tensor("transpose_186_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_187_perm_0 = const()[name = tensor("transpose_187_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_187 = transpose(perm = transpose_187_perm_0, x = var_1674_cast_fp16)[name = tensor("transpose_201")]; tensor transpose_186 = transpose(perm = transpose_186_perm_0, x = mul_29_cast_fp16)[name = tensor("transpose_202")]; tensor matmul_29_cast_fp16 = matmul(transpose_x = matmul_29_transpose_x_0, transpose_y = matmul_29_transpose_y_0, x = transpose_186, y = transpose_187)[name = tensor("matmul_29_cast_fp16")]; tensor softmax_29_axis_0 = const()[name = tensor("softmax_29_axis_0"), val = tensor(-1)]; tensor softmax_29_cast_fp16 = softmax(axis = softmax_29_axis_0, x = matmul_29_cast_fp16)[name = tensor("softmax_29_cast_fp16")]; tensor attn_output_59_transpose_x_0 = const()[name = tensor("attn_output_59_transpose_x_0"), val = tensor(false)]; tensor attn_output_59_transpose_y_0 = const()[name = tensor("attn_output_59_transpose_y_0"), val = tensor(false)]; tensor value_119_cast_fp16 = transpose(perm = value_119_perm_0, x = var_1677_cast_fp16)[name = tensor("transpose_203")]; tensor attn_output_59_cast_fp16 = matmul(transpose_x = attn_output_59_transpose_x_0, transpose_y = attn_output_59_transpose_y_0, x = softmax_29_cast_fp16, y = value_119_cast_fp16)[name = tensor("attn_output_59_cast_fp16")]; tensor var_1680_perm_0 = const()[name = tensor("op_1680_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1682 = const()[name = tensor("op_1682"), val = tensor([1, 1500, 1280])]; tensor var_1680_cast_fp16 = transpose(perm = var_1680_perm_0, x = attn_output_59_cast_fp16)[name = tensor("transpose_200")]; tensor input_297_cast_fp16 = reshape(shape = var_1682, x = var_1680_cast_fp16)[name = tensor("input_297_cast_fp16")]; tensor encoder_layers_29_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_29_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1165747776)))]; tensor encoder_layers_29_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_29_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1169024640)))]; tensor linear_177_cast_fp16 = linear(bias = encoder_layers_29_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_29_self_attn_out_proj_weight_to_fp16, x = input_297_cast_fp16)[name = tensor("linear_177_cast_fp16")]; tensor input_299_cast_fp16 = add(x = input_295_cast_fp16, y = linear_177_cast_fp16)[name = tensor("input_299_cast_fp16")]; tensor input_301_axes_0 = const()[name = tensor("input_301_axes_0"), val = tensor([-1])]; tensor encoder_layers_29_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_29_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1169027264)))]; tensor encoder_layers_29_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_29_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1169029888)))]; tensor input_301_cast_fp16 = layer_norm(axes = input_301_axes_0, beta = encoder_layers_29_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_29_final_layer_norm_weight_to_fp16, x = input_299_cast_fp16)[name = tensor("input_301_cast_fp16")]; tensor encoder_layers_29_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_29_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1169032512)))]; tensor encoder_layers_29_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_29_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1182139776)))]; tensor linear_178_cast_fp16 = linear(bias = encoder_layers_29_fc1_bias_to_fp16, weight = encoder_layers_29_fc1_weight_to_fp16, x = input_301_cast_fp16)[name = tensor("linear_178_cast_fp16")]; tensor input_303_mode_0 = const()[name = tensor("input_303_mode_0"), val = tensor("EXACT")]; tensor input_303_cast_fp16 = gelu(mode = input_303_mode_0, x = linear_178_cast_fp16)[name = tensor("input_303_cast_fp16")]; tensor encoder_layers_29_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_29_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1182150080)))]; tensor encoder_layers_29_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_29_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1195257344)))]; tensor linear_179_cast_fp16 = linear(bias = encoder_layers_29_fc2_bias_to_fp16, weight = encoder_layers_29_fc2_weight_to_fp16, x = input_303_cast_fp16)[name = tensor("linear_179_cast_fp16")]; tensor input_305_cast_fp16 = add(x = input_299_cast_fp16, y = linear_179_cast_fp16)[name = tensor("input_305_cast_fp16")]; tensor hidden_states_185_axes_0 = const()[name = tensor("hidden_states_185_axes_0"), val = tensor([-1])]; tensor encoder_layers_30_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_30_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1195259968)))]; tensor encoder_layers_30_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_30_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1195262592)))]; tensor hidden_states_185_cast_fp16 = layer_norm(axes = hidden_states_185_axes_0, beta = encoder_layers_30_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_30_self_attn_layer_norm_weight_to_fp16, x = input_305_cast_fp16)[name = tensor("hidden_states_185_cast_fp16")]; tensor encoder_layers_30_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_30_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1195265216)))]; tensor encoder_layers_30_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_30_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1198542080)))]; tensor linear_180_cast_fp16 = linear(bias = encoder_layers_30_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_30_self_attn_q_proj_weight_to_fp16, x = hidden_states_185_cast_fp16)[name = tensor("linear_180_cast_fp16")]; tensor encoder_layers_30_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_30_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1198544704)))]; tensor linear_181_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_30_self_attn_k_proj_weight_to_fp16, x = hidden_states_185_cast_fp16)[name = tensor("linear_181_cast_fp16")]; tensor encoder_layers_30_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_30_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1201821568)))]; tensor encoder_layers_30_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_30_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1205098432)))]; tensor linear_182_cast_fp16 = linear(bias = encoder_layers_30_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_30_self_attn_v_proj_weight_to_fp16, x = hidden_states_185_cast_fp16)[name = tensor("linear_182_cast_fp16")]; tensor var_1723 = const()[name = tensor("op_1723"), val = tensor([1, 1500, 20, 64])]; tensor var_1724_cast_fp16 = reshape(shape = var_1723, x = linear_180_cast_fp16)[name = tensor("op_1724_cast_fp16")]; tensor var_1726 = const()[name = tensor("op_1726"), val = tensor([1, 1500, 20, 64])]; tensor var_1727_cast_fp16 = reshape(shape = var_1726, x = linear_181_cast_fp16)[name = tensor("op_1727_cast_fp16")]; tensor var_1729 = const()[name = tensor("op_1729"), val = tensor([1, 1500, 20, 64])]; tensor var_1730_cast_fp16 = reshape(shape = var_1729, x = linear_182_cast_fp16)[name = tensor("op_1730_cast_fp16")]; tensor value_123_perm_0 = const()[name = tensor("value_123_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_30_cast_fp16 = mul(x = var_1724_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_30_cast_fp16")]; tensor matmul_30_transpose_y_0 = const()[name = tensor("matmul_30_transpose_y_0"), val = tensor(true)]; tensor matmul_30_transpose_x_0 = const()[name = tensor("matmul_30_transpose_x_0"), val = tensor(false)]; tensor transpose_188_perm_0 = const()[name = tensor("transpose_188_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_189_perm_0 = const()[name = tensor("transpose_189_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_189 = transpose(perm = transpose_189_perm_0, x = var_1727_cast_fp16)[name = tensor("transpose_197")]; tensor transpose_188 = transpose(perm = transpose_188_perm_0, x = mul_30_cast_fp16)[name = tensor("transpose_198")]; tensor matmul_30_cast_fp16 = matmul(transpose_x = matmul_30_transpose_x_0, transpose_y = matmul_30_transpose_y_0, x = transpose_188, y = transpose_189)[name = tensor("matmul_30_cast_fp16")]; tensor softmax_30_axis_0 = const()[name = tensor("softmax_30_axis_0"), val = tensor(-1)]; tensor softmax_30_cast_fp16 = softmax(axis = softmax_30_axis_0, x = matmul_30_cast_fp16)[name = tensor("softmax_30_cast_fp16")]; tensor attn_output_61_transpose_x_0 = const()[name = tensor("attn_output_61_transpose_x_0"), val = tensor(false)]; tensor attn_output_61_transpose_y_0 = const()[name = tensor("attn_output_61_transpose_y_0"), val = tensor(false)]; tensor value_123_cast_fp16 = transpose(perm = value_123_perm_0, x = var_1730_cast_fp16)[name = tensor("transpose_199")]; tensor attn_output_61_cast_fp16 = matmul(transpose_x = attn_output_61_transpose_x_0, transpose_y = attn_output_61_transpose_y_0, x = softmax_30_cast_fp16, y = value_123_cast_fp16)[name = tensor("attn_output_61_cast_fp16")]; tensor var_1733_perm_0 = const()[name = tensor("op_1733_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1735 = const()[name = tensor("op_1735"), val = tensor([1, 1500, 1280])]; tensor var_1733_cast_fp16 = transpose(perm = var_1733_perm_0, x = attn_output_61_cast_fp16)[name = tensor("transpose_196")]; tensor input_307_cast_fp16 = reshape(shape = var_1735, x = var_1733_cast_fp16)[name = tensor("input_307_cast_fp16")]; tensor encoder_layers_30_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_30_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1205101056)))]; tensor encoder_layers_30_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_30_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1208377920)))]; tensor linear_183_cast_fp16 = linear(bias = encoder_layers_30_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_30_self_attn_out_proj_weight_to_fp16, x = input_307_cast_fp16)[name = tensor("linear_183_cast_fp16")]; tensor input_309_cast_fp16 = add(x = input_305_cast_fp16, y = linear_183_cast_fp16)[name = tensor("input_309_cast_fp16")]; tensor input_311_axes_0 = const()[name = tensor("input_311_axes_0"), val = tensor([-1])]; tensor encoder_layers_30_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_30_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1208380544)))]; tensor encoder_layers_30_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_30_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1208383168)))]; tensor input_311_cast_fp16 = layer_norm(axes = input_311_axes_0, beta = encoder_layers_30_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_30_final_layer_norm_weight_to_fp16, x = input_309_cast_fp16)[name = tensor("input_311_cast_fp16")]; tensor encoder_layers_30_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_30_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1208385792)))]; tensor encoder_layers_30_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_30_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1221493056)))]; tensor linear_184_cast_fp16 = linear(bias = encoder_layers_30_fc1_bias_to_fp16, weight = encoder_layers_30_fc1_weight_to_fp16, x = input_311_cast_fp16)[name = tensor("linear_184_cast_fp16")]; tensor input_313_mode_0 = const()[name = tensor("input_313_mode_0"), val = tensor("EXACT")]; tensor input_313_cast_fp16 = gelu(mode = input_313_mode_0, x = linear_184_cast_fp16)[name = tensor("input_313_cast_fp16")]; tensor encoder_layers_30_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_30_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1221503360)))]; tensor encoder_layers_30_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_30_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1234610624)))]; tensor linear_185_cast_fp16 = linear(bias = encoder_layers_30_fc2_bias_to_fp16, weight = encoder_layers_30_fc2_weight_to_fp16, x = input_313_cast_fp16)[name = tensor("linear_185_cast_fp16")]; tensor input_315_cast_fp16 = add(x = input_309_cast_fp16, y = linear_185_cast_fp16)[name = tensor("input_315_cast_fp16")]; tensor hidden_states_191_axes_0 = const()[name = tensor("hidden_states_191_axes_0"), val = tensor([-1])]; tensor encoder_layers_31_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_31_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1234613248)))]; tensor encoder_layers_31_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_31_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1234615872)))]; tensor hidden_states_191_cast_fp16 = layer_norm(axes = hidden_states_191_axes_0, beta = encoder_layers_31_self_attn_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_31_self_attn_layer_norm_weight_to_fp16, x = input_315_cast_fp16)[name = tensor("hidden_states_191_cast_fp16")]; tensor encoder_layers_31_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_31_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1234618496)))]; tensor encoder_layers_31_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_31_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1237895360)))]; tensor linear_186_cast_fp16 = linear(bias = encoder_layers_31_self_attn_q_proj_bias_to_fp16, weight = encoder_layers_31_self_attn_q_proj_weight_to_fp16, x = hidden_states_191_cast_fp16)[name = tensor("linear_186_cast_fp16")]; tensor encoder_layers_31_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_31_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1237897984)))]; tensor linear_187_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_31_self_attn_k_proj_weight_to_fp16, x = hidden_states_191_cast_fp16)[name = tensor("linear_187_cast_fp16")]; tensor encoder_layers_31_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_31_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1241174848)))]; tensor encoder_layers_31_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_31_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1244451712)))]; tensor linear_188_cast_fp16 = linear(bias = encoder_layers_31_self_attn_v_proj_bias_to_fp16, weight = encoder_layers_31_self_attn_v_proj_weight_to_fp16, x = hidden_states_191_cast_fp16)[name = tensor("linear_188_cast_fp16")]; tensor var_1776 = const()[name = tensor("op_1776"), val = tensor([1, 1500, 20, 64])]; tensor var_1777_cast_fp16 = reshape(shape = var_1776, x = linear_186_cast_fp16)[name = tensor("op_1777_cast_fp16")]; tensor var_1779 = const()[name = tensor("op_1779"), val = tensor([1, 1500, 20, 64])]; tensor var_1780_cast_fp16 = reshape(shape = var_1779, x = linear_187_cast_fp16)[name = tensor("op_1780_cast_fp16")]; tensor var_1782 = const()[name = tensor("op_1782"), val = tensor([1, 1500, 20, 64])]; tensor var_1783_cast_fp16 = reshape(shape = var_1782, x = linear_188_cast_fp16)[name = tensor("op_1783_cast_fp16")]; tensor value_perm_0 = const()[name = tensor("value_perm_0"), val = tensor([0, 2, 1, 3])]; tensor mul_31_cast_fp16 = mul(x = var_1777_cast_fp16, y = var_6_to_fp16)[name = tensor("mul_31_cast_fp16")]; tensor matmul_31_transpose_y_0 = const()[name = tensor("matmul_31_transpose_y_0"), val = tensor(true)]; tensor matmul_31_transpose_x_0 = const()[name = tensor("matmul_31_transpose_x_0"), val = tensor(false)]; tensor transpose_190_perm_0 = const()[name = tensor("transpose_190_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_191_perm_0 = const()[name = tensor("transpose_191_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_191 = transpose(perm = transpose_191_perm_0, x = var_1780_cast_fp16)[name = tensor("transpose_193")]; tensor transpose_190 = transpose(perm = transpose_190_perm_0, x = mul_31_cast_fp16)[name = tensor("transpose_194")]; tensor matmul_31_cast_fp16 = matmul(transpose_x = matmul_31_transpose_x_0, transpose_y = matmul_31_transpose_y_0, x = transpose_190, y = transpose_191)[name = tensor("matmul_31_cast_fp16")]; tensor softmax_31_axis_0 = const()[name = tensor("softmax_31_axis_0"), val = tensor(-1)]; tensor softmax_31_cast_fp16 = softmax(axis = softmax_31_axis_0, x = matmul_31_cast_fp16)[name = tensor("softmax_31_cast_fp16")]; tensor attn_output_transpose_x_0 = const()[name = tensor("attn_output_transpose_x_0"), val = tensor(false)]; tensor attn_output_transpose_y_0 = const()[name = tensor("attn_output_transpose_y_0"), val = tensor(false)]; tensor value_cast_fp16 = transpose(perm = value_perm_0, x = var_1783_cast_fp16)[name = tensor("transpose_195")]; tensor attn_output_cast_fp16 = matmul(transpose_x = attn_output_transpose_x_0, transpose_y = attn_output_transpose_y_0, x = softmax_31_cast_fp16, y = value_cast_fp16)[name = tensor("attn_output_cast_fp16")]; tensor var_1786_perm_0 = const()[name = tensor("op_1786_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1788 = const()[name = tensor("op_1788"), val = tensor([1, 1500, 1280])]; tensor var_1786_cast_fp16 = transpose(perm = var_1786_perm_0, x = attn_output_cast_fp16)[name = tensor("transpose_192")]; tensor input_317_cast_fp16 = reshape(shape = var_1788, x = var_1786_cast_fp16)[name = tensor("input_317_cast_fp16")]; tensor encoder_layers_31_self_attn_out_proj_weight_to_fp16 = const()[name = tensor("encoder_layers_31_self_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1244454336)))]; tensor encoder_layers_31_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("encoder_layers_31_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1247731200)))]; tensor linear_189_cast_fp16 = linear(bias = encoder_layers_31_self_attn_out_proj_bias_to_fp16, weight = encoder_layers_31_self_attn_out_proj_weight_to_fp16, x = input_317_cast_fp16)[name = tensor("linear_189_cast_fp16")]; tensor input_319_cast_fp16 = add(x = input_315_cast_fp16, y = linear_189_cast_fp16)[name = tensor("input_319_cast_fp16")]; tensor input_321_axes_0 = const()[name = tensor("input_321_axes_0"), val = tensor([-1])]; tensor encoder_layers_31_final_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_31_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1247733824)))]; tensor encoder_layers_31_final_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_31_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1247736448)))]; tensor input_321_cast_fp16 = layer_norm(axes = input_321_axes_0, beta = encoder_layers_31_final_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layers_31_final_layer_norm_weight_to_fp16, x = input_319_cast_fp16)[name = tensor("input_321_cast_fp16")]; tensor encoder_layers_31_fc1_weight_to_fp16 = const()[name = tensor("encoder_layers_31_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1247739072)))]; tensor encoder_layers_31_fc1_bias_to_fp16 = const()[name = tensor("encoder_layers_31_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1260846336)))]; tensor linear_190_cast_fp16 = linear(bias = encoder_layers_31_fc1_bias_to_fp16, weight = encoder_layers_31_fc1_weight_to_fp16, x = input_321_cast_fp16)[name = tensor("linear_190_cast_fp16")]; tensor input_323_mode_0 = const()[name = tensor("input_323_mode_0"), val = tensor("EXACT")]; tensor input_323_cast_fp16 = gelu(mode = input_323_mode_0, x = linear_190_cast_fp16)[name = tensor("input_323_cast_fp16")]; tensor encoder_layers_31_fc2_weight_to_fp16 = const()[name = tensor("encoder_layers_31_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1260856640)))]; tensor encoder_layers_31_fc2_bias_to_fp16 = const()[name = tensor("encoder_layers_31_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1273963904)))]; tensor linear_191_cast_fp16 = linear(bias = encoder_layers_31_fc2_bias_to_fp16, weight = encoder_layers_31_fc2_weight_to_fp16, x = input_323_cast_fp16)[name = tensor("linear_191_cast_fp16")]; tensor input_325_cast_fp16 = add(x = input_319_cast_fp16, y = linear_191_cast_fp16)[name = tensor("input_325_cast_fp16")]; tensor encoder_output_axes_0 = const()[name = tensor("encoder_output_axes_0"), val = tensor([-1])]; tensor encoder_layer_norm_weight_to_fp16 = const()[name = tensor("encoder_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1273966528)))]; tensor encoder_layer_norm_bias_to_fp16 = const()[name = tensor("encoder_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1273969152)))]; tensor encoder_output_cast_fp16 = layer_norm(axes = encoder_output_axes_0, beta = encoder_layer_norm_bias_to_fp16, epsilon = var_4_to_fp16, gamma = encoder_layer_norm_weight_to_fp16, x = input_325_cast_fp16)[name = tensor("encoder_output_cast_fp16")]; tensor var_1819 = const()[name = tensor("op_1819"), val = tensor([1, 375, 5120])]; tensor input_327_cast_fp16 = reshape(shape = var_1819, x = encoder_output_cast_fp16)[name = tensor("input_327_cast_fp16")]; tensor projector_linear_1_weight_to_fp16 = const()[name = tensor("projector_linear_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1273971776)))]; tensor linear_192_bias_0_to_fp16 = const()[name = tensor("linear_192_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1305429120)))]; tensor linear_192_cast_fp16 = linear(bias = linear_192_bias_0_to_fp16, weight = projector_linear_1_weight_to_fp16, x = input_327_cast_fp16)[name = tensor("linear_192_cast_fp16")]; tensor input_mode_0 = const()[name = tensor("input_mode_0"), val = tensor("EXACT")]; tensor input_cast_fp16 = gelu(mode = input_mode_0, x = linear_192_cast_fp16)[name = tensor("input_cast_fp16")]; tensor projector_linear_2_weight_to_fp16 = const()[name = tensor("projector_linear_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1305435328)))]; tensor linear_193_cast_fp16 = linear(bias = linear_192_bias_0_to_fp16, weight = projector_linear_2_weight_to_fp16, x = input_cast_fp16)[name = tensor("linear_193_cast_fp16")]; tensor linear_193_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("linear_193_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor audio_embeddings = cast(dtype = linear_193_cast_fp16_to_fp32_dtype_0, x = linear_193_cast_fp16)[name = tensor("cast_131")]; } -> (audio_embeddings); }