program(1.3) [buildInfo = dict({{"coremlc-component-MIL", "3520.4.1"}, {"coremlc-version", "3520.5.1"}})] { func main(tensor input_ids) { int32 inputs_embeds_batch_dims_0 = const()[name = string("inputs_embeds_batch_dims_0"), val = int32(0)]; bool inputs_embeds_validate_indices_0 = const()[name = string("inputs_embeds_validate_indices_0"), val = bool(false)]; tensor encoder_embeddings_token_embedding_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(28459136))))[name = string("encoder_embeddings_token_embedding_weight_to_fp16_palettized")]; int32 greater_equal_0_y_0 = const()[name = string("greater_equal_0_y_0"), val = int32(0)]; tensor greater_equal_0 = greater_equal(x = input_ids, y = greater_equal_0_y_0)[name = string("greater_equal_0")]; int32 slice_by_index_0 = const()[name = string("slice_by_index_0"), val = int32(49408)]; tensor add_12 = add(x = input_ids, y = slice_by_index_0)[name = string("add_12")]; tensor select_0 = select(a = input_ids, b = add_12, cond = greater_equal_0)[name = string("select_0")]; int32 greater_equal_0_y_0_1 = const()[name = string("greater_equal_0_y_0_1"), val = int32(0)]; tensor greater_equal_0_1 = greater_equal(x = select_0, y = greater_equal_0_y_0_1)[name = string("greater_equal_0_1")]; int32 slice_by_index_0_1 = const()[name = string("slice_by_index_0_1"), val = int32(49408)]; tensor add_0 = add(x = select_0, y = slice_by_index_0_1)[name = string("add_0")]; tensor select_0_1 = select(a = select_0, b = add_0, cond = greater_equal_0_1)[name = string("select_0_1")]; int32 inputs_embeds_cast_fp16_axis_0 = const()[name = string("inputs_embeds_cast_fp16_axis_0"), val = int32(0)]; tensor inputs_embeds_cast_fp16 = gather(axis = inputs_embeds_cast_fp16_axis_0, batch_dims = inputs_embeds_batch_dims_0, indices = select_0_1, validate_indices = inputs_embeds_validate_indices_0, x = encoder_embeddings_token_embedding_weight_to_fp16_palettized)[name = string("inputs_embeds_cast_fp16")]; tensor position_embeddings_to_fp16 = const()[name = string("position_embeddings_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(28854464)))]; tensor input_3_cast_fp16 = add(x = inputs_embeds_cast_fp16, y = position_embeddings_to_fp16)[name = string("input_3_cast_fp16")]; tensor hidden_states_1_axes_0 = const()[name = string("hidden_states_1_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_0_layer_norm1_weight_to_fp16 = const()[name = string("encoder_encoder_layers_0_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(28972800)))]; tensor encoder_encoder_layers_0_layer_norm1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_0_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(28974400)))]; fp16 var_11_to_fp16 = const()[name = string("op_11_to_fp16"), val = fp16(0x1.5p-17)]; tensor hidden_states_1_cast_fp16 = layer_norm(axes = hidden_states_1_axes_0, beta = encoder_encoder_layers_0_layer_norm1_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_0_layer_norm1_weight_to_fp16, x = input_3_cast_fp16)[name = string("hidden_states_1_cast_fp16")]; tensor encoder_encoder_layers_0_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(28976000))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(29418432))))[name = string("encoder_encoder_layers_0_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_0_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_0_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(29424640)))]; tensor linear_0_cast_fp16 = linear(bias = encoder_encoder_layers_0_self_attn_q_proj_bias_to_fp16, weight = encoder_encoder_layers_0_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_1_cast_fp16)[name = string("linear_0_cast_fp16")]; tensor encoder_encoder_layers_0_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(29426240))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(29868672))))[name = string("encoder_encoder_layers_0_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_0_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_0_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(29874880)))]; tensor linear_1_cast_fp16 = linear(bias = encoder_encoder_layers_0_self_attn_k_proj_bias_to_fp16, weight = encoder_encoder_layers_0_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_1_cast_fp16)[name = string("linear_1_cast_fp16")]; tensor encoder_encoder_layers_0_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(29876480))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(30318912))))[name = string("encoder_encoder_layers_0_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_0_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_0_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(30325120)))]; tensor linear_2_cast_fp16 = linear(bias = encoder_encoder_layers_0_self_attn_v_proj_bias_to_fp16, weight = encoder_encoder_layers_0_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_1_cast_fp16)[name = string("linear_2_cast_fp16")]; tensor var_82 = const()[name = string("op_82"), val = tensor([1, 77, -1, 64])]; tensor var_83_cast_fp16 = reshape(shape = var_82, x = linear_0_cast_fp16)[name = string("op_83_cast_fp16")]; tensor var_85 = const()[name = string("op_85"), val = tensor([1, 77, -1, 64])]; tensor var_86_cast_fp16 = reshape(shape = var_85, x = linear_1_cast_fp16)[name = string("op_86_cast_fp16")]; tensor var_88 = const()[name = string("op_88"), val = tensor([1, 77, -1, 64])]; tensor var_89_cast_fp16 = reshape(shape = var_88, x = linear_2_cast_fp16)[name = string("op_89_cast_fp16")]; tensor value_1_perm_0 = const()[name = string("value_1_perm_0"), val = tensor([0, 2, -3, -1])]; fp16 var_9_to_fp16 = const()[name = string("op_9_to_fp16"), val = fp16(0x1p-3)]; tensor mul_1_cast_fp16 = mul(x = var_83_cast_fp16, y = var_9_to_fp16)[name = string("mul_1_cast_fp16")]; bool matmul_0_transpose_y_0 = const()[name = string("matmul_0_transpose_y_0"), val = bool(true)]; bool matmul_0_transpose_x_0 = const()[name = string("matmul_0_transpose_x_0"), val = bool(false)]; tensor transpose_48_perm_0 = const()[name = string("transpose_48_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_49_perm_0 = const()[name = string("transpose_49_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_49 = transpose(perm = transpose_49_perm_0, x = var_86_cast_fp16)[name = string("transpose_118")]; tensor transpose_48 = transpose(perm = transpose_48_perm_0, x = mul_1_cast_fp16)[name = string("transpose_119")]; tensor matmul_0_cast_fp16 = matmul(transpose_x = matmul_0_transpose_x_0, transpose_y = matmul_0_transpose_y_0, x = transpose_48, y = transpose_49)[name = string("matmul_0_cast_fp16")]; tensor mul_0_to_fp16 = const()[name = string("mul_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(30326720)))]; tensor add_0_cast_fp16 = add(x = matmul_0_cast_fp16, y = mul_0_to_fp16)[name = string("add_0_cast_fp16")]; int32 softmax_0_axis_0 = const()[name = string("softmax_0_axis_0"), val = int32(-1)]; tensor softmax_0_cast_fp16 = softmax(axis = softmax_0_axis_0, x = add_0_cast_fp16)[name = string("softmax_0_cast_fp16")]; bool attn_output_1_transpose_x_0 = const()[name = string("attn_output_1_transpose_x_0"), val = bool(false)]; bool attn_output_1_transpose_y_0 = const()[name = string("attn_output_1_transpose_y_0"), val = bool(false)]; tensor value_1_cast_fp16 = transpose(perm = value_1_perm_0, x = var_89_cast_fp16)[name = string("transpose_117")]; tensor attn_output_1_cast_fp16 = matmul(transpose_x = attn_output_1_transpose_x_0, transpose_y = attn_output_1_transpose_y_0, x = softmax_0_cast_fp16, y = value_1_cast_fp16)[name = string("attn_output_1_cast_fp16")]; tensor var_92_perm_0 = const()[name = string("op_92_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_94 = const()[name = string("op_94"), val = tensor([1, 77, -1])]; tensor var_92_cast_fp16 = transpose(perm = var_92_perm_0, x = attn_output_1_cast_fp16)[name = string("transpose_116")]; tensor var_95_cast_fp16 = reshape(shape = var_94, x = var_92_cast_fp16)[name = string("op_95_cast_fp16")]; tensor encoder_encoder_layers_0_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(30338688))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(30781120))))[name = string("encoder_encoder_layers_0_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_0_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_0_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(30787328)))]; tensor linear_3_cast_fp16 = linear(bias = encoder_encoder_layers_0_self_attn_out_proj_bias_to_fp16, weight = encoder_encoder_layers_0_self_attn_out_proj_weight_to_fp16_palettized, x = var_95_cast_fp16)[name = string("linear_3_cast_fp16")]; tensor input_7_cast_fp16 = add(x = input_3_cast_fp16, y = linear_3_cast_fp16)[name = string("input_7_cast_fp16")]; tensor input_9_axes_0 = const()[name = string("input_9_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_0_layer_norm2_weight_to_fp16 = const()[name = string("encoder_encoder_layers_0_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(30788928)))]; tensor encoder_encoder_layers_0_layer_norm2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_0_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(30790528)))]; tensor input_9_cast_fp16 = layer_norm(axes = input_9_axes_0, beta = encoder_encoder_layers_0_layer_norm2_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_0_layer_norm2_weight_to_fp16, x = input_7_cast_fp16)[name = string("input_9_cast_fp16")]; tensor encoder_encoder_layers_0_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(30792128))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(32561664))))[name = string("encoder_encoder_layers_0_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_0_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_0_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(32586304)))]; tensor linear_4_cast_fp16 = linear(bias = encoder_encoder_layers_0_mlp_fc1_bias_to_fp16, weight = encoder_encoder_layers_0_mlp_fc1_weight_to_fp16_palettized, x = input_9_cast_fp16)[name = string("linear_4_cast_fp16")]; fp16 var_110_to_fp16 = const()[name = string("op_110_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_111_cast_fp16 = mul(x = linear_4_cast_fp16, y = var_110_to_fp16)[name = string("op_111_cast_fp16")]; tensor var_112_cast_fp16 = sigmoid(x = var_111_cast_fp16)[name = string("op_112_cast_fp16")]; tensor input_13_cast_fp16 = mul(x = linear_4_cast_fp16, y = var_112_cast_fp16)[name = string("input_13_cast_fp16")]; tensor encoder_encoder_layers_0_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(32592512))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(34362048))))[name = string("encoder_encoder_layers_0_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_0_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_0_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(34368256)))]; tensor linear_5_cast_fp16 = linear(bias = encoder_encoder_layers_0_mlp_fc2_bias_to_fp16, weight = encoder_encoder_layers_0_mlp_fc2_weight_to_fp16_palettized, x = input_13_cast_fp16)[name = string("linear_5_cast_fp16")]; tensor input_15_cast_fp16 = add(x = input_7_cast_fp16, y = linear_5_cast_fp16)[name = string("input_15_cast_fp16")]; tensor hidden_states_7_axes_0 = const()[name = string("hidden_states_7_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_1_layer_norm1_weight_to_fp16 = const()[name = string("encoder_encoder_layers_1_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(34369856)))]; tensor encoder_encoder_layers_1_layer_norm1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_1_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(34371456)))]; tensor hidden_states_7_cast_fp16 = layer_norm(axes = hidden_states_7_axes_0, beta = encoder_encoder_layers_1_layer_norm1_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_1_layer_norm1_weight_to_fp16, x = input_15_cast_fp16)[name = string("hidden_states_7_cast_fp16")]; tensor encoder_encoder_layers_1_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(34373056))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(34815488))))[name = string("encoder_encoder_layers_1_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_1_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_1_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(34821696)))]; tensor linear_6_cast_fp16 = linear(bias = encoder_encoder_layers_1_self_attn_q_proj_bias_to_fp16, weight = encoder_encoder_layers_1_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_7_cast_fp16)[name = string("linear_6_cast_fp16")]; tensor encoder_encoder_layers_1_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(34823296))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(35265728))))[name = string("encoder_encoder_layers_1_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_1_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_1_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(35271936)))]; tensor linear_7_cast_fp16 = linear(bias = encoder_encoder_layers_1_self_attn_k_proj_bias_to_fp16, weight = encoder_encoder_layers_1_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_7_cast_fp16)[name = string("linear_7_cast_fp16")]; tensor encoder_encoder_layers_1_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(35273536))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(35715968))))[name = string("encoder_encoder_layers_1_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_1_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_1_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(35722176)))]; tensor linear_8_cast_fp16 = linear(bias = encoder_encoder_layers_1_self_attn_v_proj_bias_to_fp16, weight = encoder_encoder_layers_1_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_7_cast_fp16)[name = string("linear_8_cast_fp16")]; tensor var_141 = const()[name = string("op_141"), val = tensor([1, 77, -1, 64])]; tensor var_142_cast_fp16 = reshape(shape = var_141, x = linear_6_cast_fp16)[name = string("op_142_cast_fp16")]; tensor var_144 = const()[name = string("op_144"), val = tensor([1, 77, -1, 64])]; tensor var_145_cast_fp16 = reshape(shape = var_144, x = linear_7_cast_fp16)[name = string("op_145_cast_fp16")]; tensor var_147 = const()[name = string("op_147"), val = tensor([1, 77, -1, 64])]; tensor var_148_cast_fp16 = reshape(shape = var_147, x = linear_8_cast_fp16)[name = string("op_148_cast_fp16")]; tensor value_3_perm_0 = const()[name = string("value_3_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_3_cast_fp16 = mul(x = var_142_cast_fp16, y = var_9_to_fp16)[name = string("mul_3_cast_fp16")]; bool matmul_1_transpose_y_0 = const()[name = string("matmul_1_transpose_y_0"), val = bool(true)]; bool matmul_1_transpose_x_0 = const()[name = string("matmul_1_transpose_x_0"), val = bool(false)]; tensor transpose_50_perm_0 = const()[name = string("transpose_50_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_51_perm_0 = const()[name = string("transpose_51_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_51 = transpose(perm = transpose_51_perm_0, x = var_145_cast_fp16)[name = string("transpose_114")]; tensor transpose_50 = transpose(perm = transpose_50_perm_0, x = mul_3_cast_fp16)[name = string("transpose_115")]; tensor matmul_1_cast_fp16 = matmul(transpose_x = matmul_1_transpose_x_0, transpose_y = matmul_1_transpose_y_0, x = transpose_50, y = transpose_51)[name = string("matmul_1_cast_fp16")]; tensor add_1_cast_fp16 = add(x = matmul_1_cast_fp16, y = mul_0_to_fp16)[name = string("add_1_cast_fp16")]; int32 softmax_1_axis_0 = const()[name = string("softmax_1_axis_0"), val = int32(-1)]; tensor softmax_1_cast_fp16 = softmax(axis = softmax_1_axis_0, x = add_1_cast_fp16)[name = string("softmax_1_cast_fp16")]; bool attn_output_5_transpose_x_0 = const()[name = string("attn_output_5_transpose_x_0"), val = bool(false)]; bool attn_output_5_transpose_y_0 = const()[name = string("attn_output_5_transpose_y_0"), val = bool(false)]; tensor value_3_cast_fp16 = transpose(perm = value_3_perm_0, x = var_148_cast_fp16)[name = string("transpose_113")]; tensor attn_output_5_cast_fp16 = matmul(transpose_x = attn_output_5_transpose_x_0, transpose_y = attn_output_5_transpose_y_0, x = softmax_1_cast_fp16, y = value_3_cast_fp16)[name = string("attn_output_5_cast_fp16")]; tensor var_151_perm_0 = const()[name = string("op_151_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_153 = const()[name = string("op_153"), val = tensor([1, 77, -1])]; tensor var_151_cast_fp16 = transpose(perm = var_151_perm_0, x = attn_output_5_cast_fp16)[name = string("transpose_112")]; tensor var_154_cast_fp16 = reshape(shape = var_153, x = var_151_cast_fp16)[name = string("op_154_cast_fp16")]; tensor encoder_encoder_layers_1_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(35723776))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(36166208))))[name = string("encoder_encoder_layers_1_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_1_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_1_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(36172416)))]; tensor linear_9_cast_fp16 = linear(bias = encoder_encoder_layers_1_self_attn_out_proj_bias_to_fp16, weight = encoder_encoder_layers_1_self_attn_out_proj_weight_to_fp16_palettized, x = var_154_cast_fp16)[name = string("linear_9_cast_fp16")]; tensor input_19_cast_fp16 = add(x = input_15_cast_fp16, y = linear_9_cast_fp16)[name = string("input_19_cast_fp16")]; tensor input_21_axes_0 = const()[name = string("input_21_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_1_layer_norm2_weight_to_fp16 = const()[name = string("encoder_encoder_layers_1_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(36174016)))]; tensor encoder_encoder_layers_1_layer_norm2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_1_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(36175616)))]; tensor input_21_cast_fp16 = layer_norm(axes = input_21_axes_0, beta = encoder_encoder_layers_1_layer_norm2_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_1_layer_norm2_weight_to_fp16, x = input_19_cast_fp16)[name = string("input_21_cast_fp16")]; tensor encoder_encoder_layers_1_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(36177216))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(37946752))))[name = string("encoder_encoder_layers_1_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_1_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_1_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(37971392)))]; tensor linear_10_cast_fp16 = linear(bias = encoder_encoder_layers_1_mlp_fc1_bias_to_fp16, weight = encoder_encoder_layers_1_mlp_fc1_weight_to_fp16_palettized, x = input_21_cast_fp16)[name = string("linear_10_cast_fp16")]; fp16 var_169_to_fp16 = const()[name = string("op_169_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_170_cast_fp16 = mul(x = linear_10_cast_fp16, y = var_169_to_fp16)[name = string("op_170_cast_fp16")]; tensor var_171_cast_fp16 = sigmoid(x = var_170_cast_fp16)[name = string("op_171_cast_fp16")]; tensor input_25_cast_fp16 = mul(x = linear_10_cast_fp16, y = var_171_cast_fp16)[name = string("input_25_cast_fp16")]; tensor encoder_encoder_layers_1_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(37977600))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(39747136))))[name = string("encoder_encoder_layers_1_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_1_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_1_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(39753344)))]; tensor linear_11_cast_fp16 = linear(bias = encoder_encoder_layers_1_mlp_fc2_bias_to_fp16, weight = encoder_encoder_layers_1_mlp_fc2_weight_to_fp16_palettized, x = input_25_cast_fp16)[name = string("linear_11_cast_fp16")]; tensor input_27_cast_fp16 = add(x = input_19_cast_fp16, y = linear_11_cast_fp16)[name = string("input_27_cast_fp16")]; tensor hidden_states_13_axes_0 = const()[name = string("hidden_states_13_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_2_layer_norm1_weight_to_fp16 = const()[name = string("encoder_encoder_layers_2_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(39754944)))]; tensor encoder_encoder_layers_2_layer_norm1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_2_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(39756544)))]; tensor hidden_states_13_cast_fp16 = layer_norm(axes = hidden_states_13_axes_0, beta = encoder_encoder_layers_2_layer_norm1_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_2_layer_norm1_weight_to_fp16, x = input_27_cast_fp16)[name = string("hidden_states_13_cast_fp16")]; tensor encoder_encoder_layers_2_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(39758144))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(40200576))))[name = string("encoder_encoder_layers_2_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_2_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_2_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(40206784)))]; tensor linear_12_cast_fp16 = linear(bias = encoder_encoder_layers_2_self_attn_q_proj_bias_to_fp16, weight = encoder_encoder_layers_2_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_13_cast_fp16)[name = string("linear_12_cast_fp16")]; tensor encoder_encoder_layers_2_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(40208384))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(40650816))))[name = string("encoder_encoder_layers_2_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_2_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_2_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(40657024)))]; tensor linear_13_cast_fp16 = linear(bias = encoder_encoder_layers_2_self_attn_k_proj_bias_to_fp16, weight = encoder_encoder_layers_2_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_13_cast_fp16)[name = string("linear_13_cast_fp16")]; tensor encoder_encoder_layers_2_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(40658624))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(41101056))))[name = string("encoder_encoder_layers_2_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_2_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_2_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(41107264)))]; tensor linear_14_cast_fp16 = linear(bias = encoder_encoder_layers_2_self_attn_v_proj_bias_to_fp16, weight = encoder_encoder_layers_2_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_13_cast_fp16)[name = string("linear_14_cast_fp16")]; tensor var_200 = const()[name = string("op_200"), val = tensor([1, 77, -1, 64])]; tensor var_201_cast_fp16 = reshape(shape = var_200, x = linear_12_cast_fp16)[name = string("op_201_cast_fp16")]; tensor var_203 = const()[name = string("op_203"), val = tensor([1, 77, -1, 64])]; tensor var_204_cast_fp16 = reshape(shape = var_203, x = linear_13_cast_fp16)[name = string("op_204_cast_fp16")]; tensor var_206 = const()[name = string("op_206"), val = tensor([1, 77, -1, 64])]; tensor var_207_cast_fp16 = reshape(shape = var_206, x = linear_14_cast_fp16)[name = string("op_207_cast_fp16")]; tensor value_5_perm_0 = const()[name = string("value_5_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_5_cast_fp16 = mul(x = var_201_cast_fp16, y = var_9_to_fp16)[name = string("mul_5_cast_fp16")]; bool matmul_2_transpose_y_0 = const()[name = string("matmul_2_transpose_y_0"), val = bool(true)]; bool matmul_2_transpose_x_0 = const()[name = string("matmul_2_transpose_x_0"), val = bool(false)]; tensor transpose_52_perm_0 = const()[name = string("transpose_52_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_53_perm_0 = const()[name = string("transpose_53_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_53 = transpose(perm = transpose_53_perm_0, x = var_204_cast_fp16)[name = string("transpose_110")]; tensor transpose_52 = transpose(perm = transpose_52_perm_0, x = mul_5_cast_fp16)[name = string("transpose_111")]; tensor matmul_2_cast_fp16 = matmul(transpose_x = matmul_2_transpose_x_0, transpose_y = matmul_2_transpose_y_0, x = transpose_52, y = transpose_53)[name = string("matmul_2_cast_fp16")]; tensor add_2_cast_fp16 = add(x = matmul_2_cast_fp16, y = mul_0_to_fp16)[name = string("add_2_cast_fp16")]; int32 softmax_2_axis_0 = const()[name = string("softmax_2_axis_0"), val = int32(-1)]; tensor softmax_2_cast_fp16 = softmax(axis = softmax_2_axis_0, x = add_2_cast_fp16)[name = string("softmax_2_cast_fp16")]; bool attn_output_9_transpose_x_0 = const()[name = string("attn_output_9_transpose_x_0"), val = bool(false)]; bool attn_output_9_transpose_y_0 = const()[name = string("attn_output_9_transpose_y_0"), val = bool(false)]; tensor value_5_cast_fp16 = transpose(perm = value_5_perm_0, x = var_207_cast_fp16)[name = string("transpose_109")]; tensor attn_output_9_cast_fp16 = matmul(transpose_x = attn_output_9_transpose_x_0, transpose_y = attn_output_9_transpose_y_0, x = softmax_2_cast_fp16, y = value_5_cast_fp16)[name = string("attn_output_9_cast_fp16")]; tensor var_210_perm_0 = const()[name = string("op_210_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_212 = const()[name = string("op_212"), val = tensor([1, 77, -1])]; tensor var_210_cast_fp16 = transpose(perm = var_210_perm_0, x = attn_output_9_cast_fp16)[name = string("transpose_108")]; tensor var_213_cast_fp16 = reshape(shape = var_212, x = var_210_cast_fp16)[name = string("op_213_cast_fp16")]; tensor encoder_encoder_layers_2_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(41108864))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(41551296))))[name = string("encoder_encoder_layers_2_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_2_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_2_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(41557504)))]; tensor linear_15_cast_fp16 = linear(bias = encoder_encoder_layers_2_self_attn_out_proj_bias_to_fp16, weight = encoder_encoder_layers_2_self_attn_out_proj_weight_to_fp16_palettized, x = var_213_cast_fp16)[name = string("linear_15_cast_fp16")]; tensor input_31_cast_fp16 = add(x = input_27_cast_fp16, y = linear_15_cast_fp16)[name = string("input_31_cast_fp16")]; tensor input_33_axes_0 = const()[name = string("input_33_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_2_layer_norm2_weight_to_fp16 = const()[name = string("encoder_encoder_layers_2_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(41559104)))]; tensor encoder_encoder_layers_2_layer_norm2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_2_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(41560704)))]; tensor input_33_cast_fp16 = layer_norm(axes = input_33_axes_0, beta = encoder_encoder_layers_2_layer_norm2_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_2_layer_norm2_weight_to_fp16, x = input_31_cast_fp16)[name = string("input_33_cast_fp16")]; tensor encoder_encoder_layers_2_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(41562304))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(43331840))))[name = string("encoder_encoder_layers_2_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_2_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_2_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(43356480)))]; tensor linear_16_cast_fp16 = linear(bias = encoder_encoder_layers_2_mlp_fc1_bias_to_fp16, weight = encoder_encoder_layers_2_mlp_fc1_weight_to_fp16_palettized, x = input_33_cast_fp16)[name = string("linear_16_cast_fp16")]; fp16 var_228_to_fp16 = const()[name = string("op_228_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_229_cast_fp16 = mul(x = linear_16_cast_fp16, y = var_228_to_fp16)[name = string("op_229_cast_fp16")]; tensor var_230_cast_fp16 = sigmoid(x = var_229_cast_fp16)[name = string("op_230_cast_fp16")]; tensor input_37_cast_fp16 = mul(x = linear_16_cast_fp16, y = var_230_cast_fp16)[name = string("input_37_cast_fp16")]; tensor encoder_encoder_layers_2_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(43362688))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(45132224))))[name = string("encoder_encoder_layers_2_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_2_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_2_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(45138432)))]; tensor linear_17_cast_fp16 = linear(bias = encoder_encoder_layers_2_mlp_fc2_bias_to_fp16, weight = encoder_encoder_layers_2_mlp_fc2_weight_to_fp16_palettized, x = input_37_cast_fp16)[name = string("linear_17_cast_fp16")]; tensor input_39_cast_fp16 = add(x = input_31_cast_fp16, y = linear_17_cast_fp16)[name = string("input_39_cast_fp16")]; tensor hidden_states_19_axes_0 = const()[name = string("hidden_states_19_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_3_layer_norm1_weight_to_fp16 = const()[name = string("encoder_encoder_layers_3_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(45140032)))]; tensor encoder_encoder_layers_3_layer_norm1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_3_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(45141632)))]; tensor hidden_states_19_cast_fp16 = layer_norm(axes = hidden_states_19_axes_0, beta = encoder_encoder_layers_3_layer_norm1_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_3_layer_norm1_weight_to_fp16, x = input_39_cast_fp16)[name = string("hidden_states_19_cast_fp16")]; tensor encoder_encoder_layers_3_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(45143232))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(45585664))))[name = string("encoder_encoder_layers_3_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_3_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_3_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(45591872)))]; tensor linear_18_cast_fp16 = linear(bias = encoder_encoder_layers_3_self_attn_q_proj_bias_to_fp16, weight = encoder_encoder_layers_3_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_19_cast_fp16)[name = string("linear_18_cast_fp16")]; tensor encoder_encoder_layers_3_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(45593472))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(46035904))))[name = string("encoder_encoder_layers_3_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_3_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_3_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(46042112)))]; tensor linear_19_cast_fp16 = linear(bias = encoder_encoder_layers_3_self_attn_k_proj_bias_to_fp16, weight = encoder_encoder_layers_3_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_19_cast_fp16)[name = string("linear_19_cast_fp16")]; tensor encoder_encoder_layers_3_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(46043712))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(46486144))))[name = string("encoder_encoder_layers_3_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_3_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_3_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(46492352)))]; tensor linear_20_cast_fp16 = linear(bias = encoder_encoder_layers_3_self_attn_v_proj_bias_to_fp16, weight = encoder_encoder_layers_3_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_19_cast_fp16)[name = string("linear_20_cast_fp16")]; tensor var_259 = const()[name = string("op_259"), val = tensor([1, 77, -1, 64])]; tensor var_260_cast_fp16 = reshape(shape = var_259, x = linear_18_cast_fp16)[name = string("op_260_cast_fp16")]; tensor var_262 = const()[name = string("op_262"), val = tensor([1, 77, -1, 64])]; tensor var_263_cast_fp16 = reshape(shape = var_262, x = linear_19_cast_fp16)[name = string("op_263_cast_fp16")]; tensor var_265 = const()[name = string("op_265"), val = tensor([1, 77, -1, 64])]; tensor var_266_cast_fp16 = reshape(shape = var_265, x = linear_20_cast_fp16)[name = string("op_266_cast_fp16")]; tensor value_7_perm_0 = const()[name = string("value_7_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_7_cast_fp16 = mul(x = var_260_cast_fp16, y = var_9_to_fp16)[name = string("mul_7_cast_fp16")]; bool matmul_3_transpose_y_0 = const()[name = string("matmul_3_transpose_y_0"), val = bool(true)]; bool matmul_3_transpose_x_0 = const()[name = string("matmul_3_transpose_x_0"), val = bool(false)]; tensor transpose_54_perm_0 = const()[name = string("transpose_54_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_55_perm_0 = const()[name = string("transpose_55_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_55 = transpose(perm = transpose_55_perm_0, x = var_263_cast_fp16)[name = string("transpose_106")]; tensor transpose_54 = transpose(perm = transpose_54_perm_0, x = mul_7_cast_fp16)[name = string("transpose_107")]; tensor matmul_3_cast_fp16 = matmul(transpose_x = matmul_3_transpose_x_0, transpose_y = matmul_3_transpose_y_0, x = transpose_54, y = transpose_55)[name = string("matmul_3_cast_fp16")]; tensor add_3_cast_fp16 = add(x = matmul_3_cast_fp16, y = mul_0_to_fp16)[name = string("add_3_cast_fp16")]; int32 softmax_3_axis_0 = const()[name = string("softmax_3_axis_0"), val = int32(-1)]; tensor softmax_3_cast_fp16 = softmax(axis = softmax_3_axis_0, x = add_3_cast_fp16)[name = string("softmax_3_cast_fp16")]; bool attn_output_13_transpose_x_0 = const()[name = string("attn_output_13_transpose_x_0"), val = bool(false)]; bool attn_output_13_transpose_y_0 = const()[name = string("attn_output_13_transpose_y_0"), val = bool(false)]; tensor value_7_cast_fp16 = transpose(perm = value_7_perm_0, x = var_266_cast_fp16)[name = string("transpose_105")]; tensor attn_output_13_cast_fp16 = matmul(transpose_x = attn_output_13_transpose_x_0, transpose_y = attn_output_13_transpose_y_0, x = softmax_3_cast_fp16, y = value_7_cast_fp16)[name = string("attn_output_13_cast_fp16")]; tensor var_269_perm_0 = const()[name = string("op_269_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_271 = const()[name = string("op_271"), val = tensor([1, 77, -1])]; tensor var_269_cast_fp16 = transpose(perm = var_269_perm_0, x = attn_output_13_cast_fp16)[name = string("transpose_104")]; tensor var_272_cast_fp16 = reshape(shape = var_271, x = var_269_cast_fp16)[name = string("op_272_cast_fp16")]; tensor encoder_encoder_layers_3_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(46493952))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(46936384))))[name = string("encoder_encoder_layers_3_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_3_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_3_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(46942592)))]; tensor linear_21_cast_fp16 = linear(bias = encoder_encoder_layers_3_self_attn_out_proj_bias_to_fp16, weight = encoder_encoder_layers_3_self_attn_out_proj_weight_to_fp16_palettized, x = var_272_cast_fp16)[name = string("linear_21_cast_fp16")]; tensor input_43_cast_fp16 = add(x = input_39_cast_fp16, y = linear_21_cast_fp16)[name = string("input_43_cast_fp16")]; tensor input_45_axes_0 = const()[name = string("input_45_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_3_layer_norm2_weight_to_fp16 = const()[name = string("encoder_encoder_layers_3_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(46944192)))]; tensor encoder_encoder_layers_3_layer_norm2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_3_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(46945792)))]; tensor input_45_cast_fp16 = layer_norm(axes = input_45_axes_0, beta = encoder_encoder_layers_3_layer_norm2_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_3_layer_norm2_weight_to_fp16, x = input_43_cast_fp16)[name = string("input_45_cast_fp16")]; tensor encoder_encoder_layers_3_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(46947392))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(48716928))))[name = string("encoder_encoder_layers_3_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_3_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_3_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(48741568)))]; tensor linear_22_cast_fp16 = linear(bias = encoder_encoder_layers_3_mlp_fc1_bias_to_fp16, weight = encoder_encoder_layers_3_mlp_fc1_weight_to_fp16_palettized, x = input_45_cast_fp16)[name = string("linear_22_cast_fp16")]; fp16 var_287_to_fp16 = const()[name = string("op_287_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_288_cast_fp16 = mul(x = linear_22_cast_fp16, y = var_287_to_fp16)[name = string("op_288_cast_fp16")]; tensor var_289_cast_fp16 = sigmoid(x = var_288_cast_fp16)[name = string("op_289_cast_fp16")]; tensor input_49_cast_fp16 = mul(x = linear_22_cast_fp16, y = var_289_cast_fp16)[name = string("input_49_cast_fp16")]; tensor encoder_encoder_layers_3_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(48747776))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(50517312))))[name = string("encoder_encoder_layers_3_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_3_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_3_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(50523520)))]; tensor linear_23_cast_fp16 = linear(bias = encoder_encoder_layers_3_mlp_fc2_bias_to_fp16, weight = encoder_encoder_layers_3_mlp_fc2_weight_to_fp16_palettized, x = input_49_cast_fp16)[name = string("linear_23_cast_fp16")]; tensor input_51_cast_fp16 = add(x = input_43_cast_fp16, y = linear_23_cast_fp16)[name = string("input_51_cast_fp16")]; tensor hidden_states_25_axes_0 = const()[name = string("hidden_states_25_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_4_layer_norm1_weight_to_fp16 = const()[name = string("encoder_encoder_layers_4_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(50525120)))]; tensor encoder_encoder_layers_4_layer_norm1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_4_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(50526720)))]; tensor hidden_states_25_cast_fp16 = layer_norm(axes = hidden_states_25_axes_0, beta = encoder_encoder_layers_4_layer_norm1_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_4_layer_norm1_weight_to_fp16, x = input_51_cast_fp16)[name = string("hidden_states_25_cast_fp16")]; tensor encoder_encoder_layers_4_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(50528320))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(50970752))))[name = string("encoder_encoder_layers_4_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_4_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_4_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(50976960)))]; tensor linear_24_cast_fp16 = linear(bias = encoder_encoder_layers_4_self_attn_q_proj_bias_to_fp16, weight = encoder_encoder_layers_4_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_25_cast_fp16)[name = string("linear_24_cast_fp16")]; tensor encoder_encoder_layers_4_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(50978560))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(51420992))))[name = string("encoder_encoder_layers_4_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_4_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_4_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(51427200)))]; tensor linear_25_cast_fp16 = linear(bias = encoder_encoder_layers_4_self_attn_k_proj_bias_to_fp16, weight = encoder_encoder_layers_4_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_25_cast_fp16)[name = string("linear_25_cast_fp16")]; tensor encoder_encoder_layers_4_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(51428800))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(51871232))))[name = string("encoder_encoder_layers_4_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_4_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_4_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(51877440)))]; tensor linear_26_cast_fp16 = linear(bias = encoder_encoder_layers_4_self_attn_v_proj_bias_to_fp16, weight = encoder_encoder_layers_4_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_25_cast_fp16)[name = string("linear_26_cast_fp16")]; tensor var_318 = const()[name = string("op_318"), val = tensor([1, 77, -1, 64])]; tensor var_319_cast_fp16 = reshape(shape = var_318, x = linear_24_cast_fp16)[name = string("op_319_cast_fp16")]; tensor var_321 = const()[name = string("op_321"), val = tensor([1, 77, -1, 64])]; tensor var_322_cast_fp16 = reshape(shape = var_321, x = linear_25_cast_fp16)[name = string("op_322_cast_fp16")]; tensor var_324 = const()[name = string("op_324"), val = tensor([1, 77, -1, 64])]; tensor var_325_cast_fp16 = reshape(shape = var_324, x = linear_26_cast_fp16)[name = string("op_325_cast_fp16")]; tensor value_9_perm_0 = const()[name = string("value_9_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_9_cast_fp16 = mul(x = var_319_cast_fp16, y = var_9_to_fp16)[name = string("mul_9_cast_fp16")]; bool matmul_4_transpose_y_0 = const()[name = string("matmul_4_transpose_y_0"), val = bool(true)]; bool matmul_4_transpose_x_0 = const()[name = string("matmul_4_transpose_x_0"), val = bool(false)]; tensor transpose_56_perm_0 = const()[name = string("transpose_56_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_57_perm_0 = const()[name = string("transpose_57_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_57 = transpose(perm = transpose_57_perm_0, x = var_322_cast_fp16)[name = string("transpose_102")]; tensor transpose_56 = transpose(perm = transpose_56_perm_0, x = mul_9_cast_fp16)[name = string("transpose_103")]; tensor matmul_4_cast_fp16 = matmul(transpose_x = matmul_4_transpose_x_0, transpose_y = matmul_4_transpose_y_0, x = transpose_56, y = transpose_57)[name = string("matmul_4_cast_fp16")]; tensor add_4_cast_fp16 = add(x = matmul_4_cast_fp16, y = mul_0_to_fp16)[name = string("add_4_cast_fp16")]; int32 softmax_4_axis_0 = const()[name = string("softmax_4_axis_0"), val = int32(-1)]; tensor softmax_4_cast_fp16 = softmax(axis = softmax_4_axis_0, x = add_4_cast_fp16)[name = string("softmax_4_cast_fp16")]; bool attn_output_17_transpose_x_0 = const()[name = string("attn_output_17_transpose_x_0"), val = bool(false)]; bool attn_output_17_transpose_y_0 = const()[name = string("attn_output_17_transpose_y_0"), val = bool(false)]; tensor value_9_cast_fp16 = transpose(perm = value_9_perm_0, x = var_325_cast_fp16)[name = string("transpose_101")]; tensor attn_output_17_cast_fp16 = matmul(transpose_x = attn_output_17_transpose_x_0, transpose_y = attn_output_17_transpose_y_0, x = softmax_4_cast_fp16, y = value_9_cast_fp16)[name = string("attn_output_17_cast_fp16")]; tensor var_328_perm_0 = const()[name = string("op_328_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_330 = const()[name = string("op_330"), val = tensor([1, 77, -1])]; tensor var_328_cast_fp16 = transpose(perm = var_328_perm_0, x = attn_output_17_cast_fp16)[name = string("transpose_100")]; tensor var_331_cast_fp16 = reshape(shape = var_330, x = var_328_cast_fp16)[name = string("op_331_cast_fp16")]; tensor encoder_encoder_layers_4_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(51879040))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(52321472))))[name = string("encoder_encoder_layers_4_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_4_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_4_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(52327680)))]; tensor linear_27_cast_fp16 = linear(bias = encoder_encoder_layers_4_self_attn_out_proj_bias_to_fp16, weight = encoder_encoder_layers_4_self_attn_out_proj_weight_to_fp16_palettized, x = var_331_cast_fp16)[name = string("linear_27_cast_fp16")]; tensor input_55_cast_fp16 = add(x = input_51_cast_fp16, y = linear_27_cast_fp16)[name = string("input_55_cast_fp16")]; tensor input_57_axes_0 = const()[name = string("input_57_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_4_layer_norm2_weight_to_fp16 = const()[name = string("encoder_encoder_layers_4_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(52329280)))]; tensor encoder_encoder_layers_4_layer_norm2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_4_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(52330880)))]; tensor input_57_cast_fp16 = layer_norm(axes = input_57_axes_0, beta = encoder_encoder_layers_4_layer_norm2_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_4_layer_norm2_weight_to_fp16, x = input_55_cast_fp16)[name = string("input_57_cast_fp16")]; tensor encoder_encoder_layers_4_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(52332480))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(54102016))))[name = string("encoder_encoder_layers_4_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_4_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_4_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(54126656)))]; tensor linear_28_cast_fp16 = linear(bias = encoder_encoder_layers_4_mlp_fc1_bias_to_fp16, weight = encoder_encoder_layers_4_mlp_fc1_weight_to_fp16_palettized, x = input_57_cast_fp16)[name = string("linear_28_cast_fp16")]; fp16 var_346_to_fp16 = const()[name = string("op_346_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_347_cast_fp16 = mul(x = linear_28_cast_fp16, y = var_346_to_fp16)[name = string("op_347_cast_fp16")]; tensor var_348_cast_fp16 = sigmoid(x = var_347_cast_fp16)[name = string("op_348_cast_fp16")]; tensor input_61_cast_fp16 = mul(x = linear_28_cast_fp16, y = var_348_cast_fp16)[name = string("input_61_cast_fp16")]; tensor encoder_encoder_layers_4_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(54132864))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(55902400))))[name = string("encoder_encoder_layers_4_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_4_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_4_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(55908608)))]; tensor linear_29_cast_fp16 = linear(bias = encoder_encoder_layers_4_mlp_fc2_bias_to_fp16, weight = encoder_encoder_layers_4_mlp_fc2_weight_to_fp16_palettized, x = input_61_cast_fp16)[name = string("linear_29_cast_fp16")]; tensor input_63_cast_fp16 = add(x = input_55_cast_fp16, y = linear_29_cast_fp16)[name = string("input_63_cast_fp16")]; tensor hidden_states_31_axes_0 = const()[name = string("hidden_states_31_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_5_layer_norm1_weight_to_fp16 = const()[name = string("encoder_encoder_layers_5_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(55910208)))]; tensor encoder_encoder_layers_5_layer_norm1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_5_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(55911808)))]; tensor hidden_states_31_cast_fp16 = layer_norm(axes = hidden_states_31_axes_0, beta = encoder_encoder_layers_5_layer_norm1_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_5_layer_norm1_weight_to_fp16, x = input_63_cast_fp16)[name = string("hidden_states_31_cast_fp16")]; tensor encoder_encoder_layers_5_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(55913408))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(56355840))))[name = string("encoder_encoder_layers_5_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_5_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_5_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(56362048)))]; tensor linear_30_cast_fp16 = linear(bias = encoder_encoder_layers_5_self_attn_q_proj_bias_to_fp16, weight = encoder_encoder_layers_5_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_31_cast_fp16)[name = string("linear_30_cast_fp16")]; tensor encoder_encoder_layers_5_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(56363648))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(56806080))))[name = string("encoder_encoder_layers_5_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_5_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_5_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(56812288)))]; tensor linear_31_cast_fp16 = linear(bias = encoder_encoder_layers_5_self_attn_k_proj_bias_to_fp16, weight = encoder_encoder_layers_5_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_31_cast_fp16)[name = string("linear_31_cast_fp16")]; tensor encoder_encoder_layers_5_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(56813888))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(57256320))))[name = string("encoder_encoder_layers_5_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_5_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_5_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(57262528)))]; tensor linear_32_cast_fp16 = linear(bias = encoder_encoder_layers_5_self_attn_v_proj_bias_to_fp16, weight = encoder_encoder_layers_5_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_31_cast_fp16)[name = string("linear_32_cast_fp16")]; tensor var_377 = const()[name = string("op_377"), val = tensor([1, 77, -1, 64])]; tensor var_378_cast_fp16 = reshape(shape = var_377, x = linear_30_cast_fp16)[name = string("op_378_cast_fp16")]; tensor var_380 = const()[name = string("op_380"), val = tensor([1, 77, -1, 64])]; tensor var_381_cast_fp16 = reshape(shape = var_380, x = linear_31_cast_fp16)[name = string("op_381_cast_fp16")]; tensor var_383 = const()[name = string("op_383"), val = tensor([1, 77, -1, 64])]; tensor var_384_cast_fp16 = reshape(shape = var_383, x = linear_32_cast_fp16)[name = string("op_384_cast_fp16")]; tensor value_11_perm_0 = const()[name = string("value_11_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_11_cast_fp16 = mul(x = var_378_cast_fp16, y = var_9_to_fp16)[name = string("mul_11_cast_fp16")]; bool matmul_5_transpose_y_0 = const()[name = string("matmul_5_transpose_y_0"), val = bool(true)]; bool matmul_5_transpose_x_0 = const()[name = string("matmul_5_transpose_x_0"), val = bool(false)]; tensor transpose_58_perm_0 = const()[name = string("transpose_58_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_59_perm_0 = const()[name = string("transpose_59_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_59 = transpose(perm = transpose_59_perm_0, x = var_381_cast_fp16)[name = string("transpose_98")]; tensor transpose_58 = transpose(perm = transpose_58_perm_0, x = mul_11_cast_fp16)[name = string("transpose_99")]; tensor matmul_5_cast_fp16 = matmul(transpose_x = matmul_5_transpose_x_0, transpose_y = matmul_5_transpose_y_0, x = transpose_58, y = transpose_59)[name = string("matmul_5_cast_fp16")]; tensor add_5_cast_fp16 = add(x = matmul_5_cast_fp16, y = mul_0_to_fp16)[name = string("add_5_cast_fp16")]; int32 softmax_5_axis_0 = const()[name = string("softmax_5_axis_0"), val = int32(-1)]; tensor softmax_5_cast_fp16 = softmax(axis = softmax_5_axis_0, x = add_5_cast_fp16)[name = string("softmax_5_cast_fp16")]; bool attn_output_21_transpose_x_0 = const()[name = string("attn_output_21_transpose_x_0"), val = bool(false)]; bool attn_output_21_transpose_y_0 = const()[name = string("attn_output_21_transpose_y_0"), val = bool(false)]; tensor value_11_cast_fp16 = transpose(perm = value_11_perm_0, x = var_384_cast_fp16)[name = string("transpose_97")]; tensor attn_output_21_cast_fp16 = matmul(transpose_x = attn_output_21_transpose_x_0, transpose_y = attn_output_21_transpose_y_0, x = softmax_5_cast_fp16, y = value_11_cast_fp16)[name = string("attn_output_21_cast_fp16")]; tensor var_387_perm_0 = const()[name = string("op_387_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_389 = const()[name = string("op_389"), val = tensor([1, 77, -1])]; tensor var_387_cast_fp16 = transpose(perm = var_387_perm_0, x = attn_output_21_cast_fp16)[name = string("transpose_96")]; tensor var_390_cast_fp16 = reshape(shape = var_389, x = var_387_cast_fp16)[name = string("op_390_cast_fp16")]; tensor encoder_encoder_layers_5_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(57264128))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(57706560))))[name = string("encoder_encoder_layers_5_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_5_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_5_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(57712768)))]; tensor linear_33_cast_fp16 = linear(bias = encoder_encoder_layers_5_self_attn_out_proj_bias_to_fp16, weight = encoder_encoder_layers_5_self_attn_out_proj_weight_to_fp16_palettized, x = var_390_cast_fp16)[name = string("linear_33_cast_fp16")]; tensor input_67_cast_fp16 = add(x = input_63_cast_fp16, y = linear_33_cast_fp16)[name = string("input_67_cast_fp16")]; tensor input_69_axes_0 = const()[name = string("input_69_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_5_layer_norm2_weight_to_fp16 = const()[name = string("encoder_encoder_layers_5_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(57714368)))]; tensor encoder_encoder_layers_5_layer_norm2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_5_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(57715968)))]; tensor input_69_cast_fp16 = layer_norm(axes = input_69_axes_0, beta = encoder_encoder_layers_5_layer_norm2_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_5_layer_norm2_weight_to_fp16, x = input_67_cast_fp16)[name = string("input_69_cast_fp16")]; tensor encoder_encoder_layers_5_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(57717568))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(59487104))))[name = string("encoder_encoder_layers_5_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_5_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_5_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(59511744)))]; tensor linear_34_cast_fp16 = linear(bias = encoder_encoder_layers_5_mlp_fc1_bias_to_fp16, weight = encoder_encoder_layers_5_mlp_fc1_weight_to_fp16_palettized, x = input_69_cast_fp16)[name = string("linear_34_cast_fp16")]; fp16 var_405_to_fp16 = const()[name = string("op_405_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_406_cast_fp16 = mul(x = linear_34_cast_fp16, y = var_405_to_fp16)[name = string("op_406_cast_fp16")]; tensor var_407_cast_fp16 = sigmoid(x = var_406_cast_fp16)[name = string("op_407_cast_fp16")]; tensor input_73_cast_fp16 = mul(x = linear_34_cast_fp16, y = var_407_cast_fp16)[name = string("input_73_cast_fp16")]; tensor encoder_encoder_layers_5_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(59517952))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(61287488))))[name = string("encoder_encoder_layers_5_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_5_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_5_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(61293696)))]; tensor linear_35_cast_fp16 = linear(bias = encoder_encoder_layers_5_mlp_fc2_bias_to_fp16, weight = encoder_encoder_layers_5_mlp_fc2_weight_to_fp16_palettized, x = input_73_cast_fp16)[name = string("linear_35_cast_fp16")]; tensor input_75_cast_fp16 = add(x = input_67_cast_fp16, y = linear_35_cast_fp16)[name = string("input_75_cast_fp16")]; tensor hidden_states_37_axes_0 = const()[name = string("hidden_states_37_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_6_layer_norm1_weight_to_fp16 = const()[name = string("encoder_encoder_layers_6_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(61295296)))]; tensor encoder_encoder_layers_6_layer_norm1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_6_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(61296896)))]; tensor hidden_states_37_cast_fp16 = layer_norm(axes = hidden_states_37_axes_0, beta = encoder_encoder_layers_6_layer_norm1_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_6_layer_norm1_weight_to_fp16, x = input_75_cast_fp16)[name = string("hidden_states_37_cast_fp16")]; tensor encoder_encoder_layers_6_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(61298496))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(61740928))))[name = string("encoder_encoder_layers_6_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_6_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_6_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(61747136)))]; tensor linear_36_cast_fp16 = linear(bias = encoder_encoder_layers_6_self_attn_q_proj_bias_to_fp16, weight = encoder_encoder_layers_6_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_37_cast_fp16)[name = string("linear_36_cast_fp16")]; tensor encoder_encoder_layers_6_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(61748736))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(62191168))))[name = string("encoder_encoder_layers_6_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_6_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_6_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(62197376)))]; tensor linear_37_cast_fp16 = linear(bias = encoder_encoder_layers_6_self_attn_k_proj_bias_to_fp16, weight = encoder_encoder_layers_6_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_37_cast_fp16)[name = string("linear_37_cast_fp16")]; tensor encoder_encoder_layers_6_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(62198976))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(62641408))))[name = string("encoder_encoder_layers_6_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_6_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_6_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(62647616)))]; tensor linear_38_cast_fp16 = linear(bias = encoder_encoder_layers_6_self_attn_v_proj_bias_to_fp16, weight = encoder_encoder_layers_6_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_37_cast_fp16)[name = string("linear_38_cast_fp16")]; tensor var_436 = const()[name = string("op_436"), val = tensor([1, 77, -1, 64])]; tensor var_437_cast_fp16 = reshape(shape = var_436, x = linear_36_cast_fp16)[name = string("op_437_cast_fp16")]; tensor var_439 = const()[name = string("op_439"), val = tensor([1, 77, -1, 64])]; tensor var_440_cast_fp16 = reshape(shape = var_439, x = linear_37_cast_fp16)[name = string("op_440_cast_fp16")]; tensor var_442 = const()[name = string("op_442"), val = tensor([1, 77, -1, 64])]; tensor var_443_cast_fp16 = reshape(shape = var_442, x = linear_38_cast_fp16)[name = string("op_443_cast_fp16")]; tensor value_13_perm_0 = const()[name = string("value_13_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_13_cast_fp16 = mul(x = var_437_cast_fp16, y = var_9_to_fp16)[name = string("mul_13_cast_fp16")]; bool matmul_6_transpose_y_0 = const()[name = string("matmul_6_transpose_y_0"), val = bool(true)]; bool matmul_6_transpose_x_0 = const()[name = string("matmul_6_transpose_x_0"), val = bool(false)]; tensor transpose_60_perm_0 = const()[name = string("transpose_60_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_61_perm_0 = const()[name = string("transpose_61_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_61 = transpose(perm = transpose_61_perm_0, x = var_440_cast_fp16)[name = string("transpose_94")]; tensor transpose_60 = transpose(perm = transpose_60_perm_0, x = mul_13_cast_fp16)[name = string("transpose_95")]; tensor matmul_6_cast_fp16 = matmul(transpose_x = matmul_6_transpose_x_0, transpose_y = matmul_6_transpose_y_0, x = transpose_60, y = transpose_61)[name = string("matmul_6_cast_fp16")]; tensor add_6_cast_fp16 = add(x = matmul_6_cast_fp16, y = mul_0_to_fp16)[name = string("add_6_cast_fp16")]; int32 softmax_6_axis_0 = const()[name = string("softmax_6_axis_0"), val = int32(-1)]; tensor softmax_6_cast_fp16 = softmax(axis = softmax_6_axis_0, x = add_6_cast_fp16)[name = string("softmax_6_cast_fp16")]; bool attn_output_25_transpose_x_0 = const()[name = string("attn_output_25_transpose_x_0"), val = bool(false)]; bool attn_output_25_transpose_y_0 = const()[name = string("attn_output_25_transpose_y_0"), val = bool(false)]; tensor value_13_cast_fp16 = transpose(perm = value_13_perm_0, x = var_443_cast_fp16)[name = string("transpose_93")]; tensor attn_output_25_cast_fp16 = matmul(transpose_x = attn_output_25_transpose_x_0, transpose_y = attn_output_25_transpose_y_0, x = softmax_6_cast_fp16, y = value_13_cast_fp16)[name = string("attn_output_25_cast_fp16")]; tensor var_446_perm_0 = const()[name = string("op_446_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_448 = const()[name = string("op_448"), val = tensor([1, 77, -1])]; tensor var_446_cast_fp16 = transpose(perm = var_446_perm_0, x = attn_output_25_cast_fp16)[name = string("transpose_92")]; tensor var_449_cast_fp16 = reshape(shape = var_448, x = var_446_cast_fp16)[name = string("op_449_cast_fp16")]; tensor encoder_encoder_layers_6_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(62649216))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(63091648))))[name = string("encoder_encoder_layers_6_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_6_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_6_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(63097856)))]; tensor linear_39_cast_fp16 = linear(bias = encoder_encoder_layers_6_self_attn_out_proj_bias_to_fp16, weight = encoder_encoder_layers_6_self_attn_out_proj_weight_to_fp16_palettized, x = var_449_cast_fp16)[name = string("linear_39_cast_fp16")]; tensor input_79_cast_fp16 = add(x = input_75_cast_fp16, y = linear_39_cast_fp16)[name = string("input_79_cast_fp16")]; tensor input_81_axes_0 = const()[name = string("input_81_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_6_layer_norm2_weight_to_fp16 = const()[name = string("encoder_encoder_layers_6_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(63099456)))]; tensor encoder_encoder_layers_6_layer_norm2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_6_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(63101056)))]; tensor input_81_cast_fp16 = layer_norm(axes = input_81_axes_0, beta = encoder_encoder_layers_6_layer_norm2_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_6_layer_norm2_weight_to_fp16, x = input_79_cast_fp16)[name = string("input_81_cast_fp16")]; tensor encoder_encoder_layers_6_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(63102656))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64872192))))[name = string("encoder_encoder_layers_6_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_6_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_6_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64896832)))]; tensor linear_40_cast_fp16 = linear(bias = encoder_encoder_layers_6_mlp_fc1_bias_to_fp16, weight = encoder_encoder_layers_6_mlp_fc1_weight_to_fp16_palettized, x = input_81_cast_fp16)[name = string("linear_40_cast_fp16")]; fp16 var_464_to_fp16 = const()[name = string("op_464_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_465_cast_fp16 = mul(x = linear_40_cast_fp16, y = var_464_to_fp16)[name = string("op_465_cast_fp16")]; tensor var_466_cast_fp16 = sigmoid(x = var_465_cast_fp16)[name = string("op_466_cast_fp16")]; tensor input_85_cast_fp16 = mul(x = linear_40_cast_fp16, y = var_466_cast_fp16)[name = string("input_85_cast_fp16")]; tensor encoder_encoder_layers_6_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64903040))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(66672576))))[name = string("encoder_encoder_layers_6_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_6_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_6_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(66678784)))]; tensor linear_41_cast_fp16 = linear(bias = encoder_encoder_layers_6_mlp_fc2_bias_to_fp16, weight = encoder_encoder_layers_6_mlp_fc2_weight_to_fp16_palettized, x = input_85_cast_fp16)[name = string("linear_41_cast_fp16")]; tensor input_87_cast_fp16 = add(x = input_79_cast_fp16, y = linear_41_cast_fp16)[name = string("input_87_cast_fp16")]; tensor hidden_states_43_axes_0 = const()[name = string("hidden_states_43_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_7_layer_norm1_weight_to_fp16 = const()[name = string("encoder_encoder_layers_7_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(66680384)))]; tensor encoder_encoder_layers_7_layer_norm1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_7_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(66681984)))]; tensor hidden_states_43_cast_fp16 = layer_norm(axes = hidden_states_43_axes_0, beta = encoder_encoder_layers_7_layer_norm1_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_7_layer_norm1_weight_to_fp16, x = input_87_cast_fp16)[name = string("hidden_states_43_cast_fp16")]; tensor encoder_encoder_layers_7_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(66683584))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(67126016))))[name = string("encoder_encoder_layers_7_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_7_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_7_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(67132224)))]; tensor linear_42_cast_fp16 = linear(bias = encoder_encoder_layers_7_self_attn_q_proj_bias_to_fp16, weight = encoder_encoder_layers_7_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_43_cast_fp16)[name = string("linear_42_cast_fp16")]; tensor encoder_encoder_layers_7_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(67133824))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(67576256))))[name = string("encoder_encoder_layers_7_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_7_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_7_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(67582464)))]; tensor linear_43_cast_fp16 = linear(bias = encoder_encoder_layers_7_self_attn_k_proj_bias_to_fp16, weight = encoder_encoder_layers_7_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_43_cast_fp16)[name = string("linear_43_cast_fp16")]; tensor encoder_encoder_layers_7_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(67584064))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(68026496))))[name = string("encoder_encoder_layers_7_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_7_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_7_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(68032704)))]; tensor linear_44_cast_fp16 = linear(bias = encoder_encoder_layers_7_self_attn_v_proj_bias_to_fp16, weight = encoder_encoder_layers_7_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_43_cast_fp16)[name = string("linear_44_cast_fp16")]; tensor var_495 = const()[name = string("op_495"), val = tensor([1, 77, -1, 64])]; tensor var_496_cast_fp16 = reshape(shape = var_495, x = linear_42_cast_fp16)[name = string("op_496_cast_fp16")]; tensor var_498 = const()[name = string("op_498"), val = tensor([1, 77, -1, 64])]; tensor var_499_cast_fp16 = reshape(shape = var_498, x = linear_43_cast_fp16)[name = string("op_499_cast_fp16")]; tensor var_501 = const()[name = string("op_501"), val = tensor([1, 77, -1, 64])]; tensor var_502_cast_fp16 = reshape(shape = var_501, x = linear_44_cast_fp16)[name = string("op_502_cast_fp16")]; tensor value_15_perm_0 = const()[name = string("value_15_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_15_cast_fp16 = mul(x = var_496_cast_fp16, y = var_9_to_fp16)[name = string("mul_15_cast_fp16")]; bool matmul_7_transpose_y_0 = const()[name = string("matmul_7_transpose_y_0"), val = bool(true)]; bool matmul_7_transpose_x_0 = const()[name = string("matmul_7_transpose_x_0"), val = bool(false)]; tensor transpose_62_perm_0 = const()[name = string("transpose_62_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_63_perm_0 = const()[name = string("transpose_63_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_63 = transpose(perm = transpose_63_perm_0, x = var_499_cast_fp16)[name = string("transpose_90")]; tensor transpose_62 = transpose(perm = transpose_62_perm_0, x = mul_15_cast_fp16)[name = string("transpose_91")]; tensor matmul_7_cast_fp16 = matmul(transpose_x = matmul_7_transpose_x_0, transpose_y = matmul_7_transpose_y_0, x = transpose_62, y = transpose_63)[name = string("matmul_7_cast_fp16")]; tensor add_7_cast_fp16 = add(x = matmul_7_cast_fp16, y = mul_0_to_fp16)[name = string("add_7_cast_fp16")]; int32 softmax_7_axis_0 = const()[name = string("softmax_7_axis_0"), val = int32(-1)]; tensor softmax_7_cast_fp16 = softmax(axis = softmax_7_axis_0, x = add_7_cast_fp16)[name = string("softmax_7_cast_fp16")]; bool attn_output_29_transpose_x_0 = const()[name = string("attn_output_29_transpose_x_0"), val = bool(false)]; bool attn_output_29_transpose_y_0 = const()[name = string("attn_output_29_transpose_y_0"), val = bool(false)]; tensor value_15_cast_fp16 = transpose(perm = value_15_perm_0, x = var_502_cast_fp16)[name = string("transpose_89")]; tensor attn_output_29_cast_fp16 = matmul(transpose_x = attn_output_29_transpose_x_0, transpose_y = attn_output_29_transpose_y_0, x = softmax_7_cast_fp16, y = value_15_cast_fp16)[name = string("attn_output_29_cast_fp16")]; tensor var_505_perm_0 = const()[name = string("op_505_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_507 = const()[name = string("op_507"), val = tensor([1, 77, -1])]; tensor var_505_cast_fp16 = transpose(perm = var_505_perm_0, x = attn_output_29_cast_fp16)[name = string("transpose_88")]; tensor var_508_cast_fp16 = reshape(shape = var_507, x = var_505_cast_fp16)[name = string("op_508_cast_fp16")]; tensor encoder_encoder_layers_7_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(68034304))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(68476736))))[name = string("encoder_encoder_layers_7_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_7_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_7_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(68482944)))]; tensor linear_45_cast_fp16 = linear(bias = encoder_encoder_layers_7_self_attn_out_proj_bias_to_fp16, weight = encoder_encoder_layers_7_self_attn_out_proj_weight_to_fp16_palettized, x = var_508_cast_fp16)[name = string("linear_45_cast_fp16")]; tensor input_91_cast_fp16 = add(x = input_87_cast_fp16, y = linear_45_cast_fp16)[name = string("input_91_cast_fp16")]; tensor input_93_axes_0 = const()[name = string("input_93_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_7_layer_norm2_weight_to_fp16 = const()[name = string("encoder_encoder_layers_7_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(68484544)))]; tensor encoder_encoder_layers_7_layer_norm2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_7_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(68486144)))]; tensor input_93_cast_fp16 = layer_norm(axes = input_93_axes_0, beta = encoder_encoder_layers_7_layer_norm2_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_7_layer_norm2_weight_to_fp16, x = input_91_cast_fp16)[name = string("input_93_cast_fp16")]; tensor encoder_encoder_layers_7_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(68487744))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(70257280))))[name = string("encoder_encoder_layers_7_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_7_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_7_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(70281920)))]; tensor linear_46_cast_fp16 = linear(bias = encoder_encoder_layers_7_mlp_fc1_bias_to_fp16, weight = encoder_encoder_layers_7_mlp_fc1_weight_to_fp16_palettized, x = input_93_cast_fp16)[name = string("linear_46_cast_fp16")]; fp16 var_523_to_fp16 = const()[name = string("op_523_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_524_cast_fp16 = mul(x = linear_46_cast_fp16, y = var_523_to_fp16)[name = string("op_524_cast_fp16")]; tensor var_525_cast_fp16 = sigmoid(x = var_524_cast_fp16)[name = string("op_525_cast_fp16")]; tensor input_97_cast_fp16 = mul(x = linear_46_cast_fp16, y = var_525_cast_fp16)[name = string("input_97_cast_fp16")]; tensor encoder_encoder_layers_7_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(70288128))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72057664))))[name = string("encoder_encoder_layers_7_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_7_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_7_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72063872)))]; tensor linear_47_cast_fp16 = linear(bias = encoder_encoder_layers_7_mlp_fc2_bias_to_fp16, weight = encoder_encoder_layers_7_mlp_fc2_weight_to_fp16_palettized, x = input_97_cast_fp16)[name = string("linear_47_cast_fp16")]; tensor input_99_cast_fp16 = add(x = input_91_cast_fp16, y = linear_47_cast_fp16)[name = string("input_99_cast_fp16")]; tensor hidden_states_49_axes_0 = const()[name = string("hidden_states_49_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_8_layer_norm1_weight_to_fp16 = const()[name = string("encoder_encoder_layers_8_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72065472)))]; tensor encoder_encoder_layers_8_layer_norm1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_8_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72067072)))]; tensor hidden_states_49_cast_fp16 = layer_norm(axes = hidden_states_49_axes_0, beta = encoder_encoder_layers_8_layer_norm1_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_8_layer_norm1_weight_to_fp16, x = input_99_cast_fp16)[name = string("hidden_states_49_cast_fp16")]; tensor encoder_encoder_layers_8_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72068672))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72511104))))[name = string("encoder_encoder_layers_8_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_8_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_8_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72517312)))]; tensor linear_48_cast_fp16 = linear(bias = encoder_encoder_layers_8_self_attn_q_proj_bias_to_fp16, weight = encoder_encoder_layers_8_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_49_cast_fp16)[name = string("linear_48_cast_fp16")]; tensor encoder_encoder_layers_8_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72518912))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72961344))))[name = string("encoder_encoder_layers_8_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_8_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_8_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72967552)))]; tensor linear_49_cast_fp16 = linear(bias = encoder_encoder_layers_8_self_attn_k_proj_bias_to_fp16, weight = encoder_encoder_layers_8_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_49_cast_fp16)[name = string("linear_49_cast_fp16")]; tensor encoder_encoder_layers_8_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72969152))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(73411584))))[name = string("encoder_encoder_layers_8_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_8_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_8_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(73417792)))]; tensor linear_50_cast_fp16 = linear(bias = encoder_encoder_layers_8_self_attn_v_proj_bias_to_fp16, weight = encoder_encoder_layers_8_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_49_cast_fp16)[name = string("linear_50_cast_fp16")]; tensor var_554 = const()[name = string("op_554"), val = tensor([1, 77, -1, 64])]; tensor var_555_cast_fp16 = reshape(shape = var_554, x = linear_48_cast_fp16)[name = string("op_555_cast_fp16")]; tensor var_557 = const()[name = string("op_557"), val = tensor([1, 77, -1, 64])]; tensor var_558_cast_fp16 = reshape(shape = var_557, x = linear_49_cast_fp16)[name = string("op_558_cast_fp16")]; tensor var_560 = const()[name = string("op_560"), val = tensor([1, 77, -1, 64])]; tensor var_561_cast_fp16 = reshape(shape = var_560, x = linear_50_cast_fp16)[name = string("op_561_cast_fp16")]; tensor value_17_perm_0 = const()[name = string("value_17_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_17_cast_fp16 = mul(x = var_555_cast_fp16, y = var_9_to_fp16)[name = string("mul_17_cast_fp16")]; bool matmul_8_transpose_y_0 = const()[name = string("matmul_8_transpose_y_0"), val = bool(true)]; bool matmul_8_transpose_x_0 = const()[name = string("matmul_8_transpose_x_0"), val = bool(false)]; tensor transpose_64_perm_0 = const()[name = string("transpose_64_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_65_perm_0 = const()[name = string("transpose_65_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_65 = transpose(perm = transpose_65_perm_0, x = var_558_cast_fp16)[name = string("transpose_86")]; tensor transpose_64 = transpose(perm = transpose_64_perm_0, x = mul_17_cast_fp16)[name = string("transpose_87")]; tensor matmul_8_cast_fp16 = matmul(transpose_x = matmul_8_transpose_x_0, transpose_y = matmul_8_transpose_y_0, x = transpose_64, y = transpose_65)[name = string("matmul_8_cast_fp16")]; tensor add_8_cast_fp16 = add(x = matmul_8_cast_fp16, y = mul_0_to_fp16)[name = string("add_8_cast_fp16")]; int32 softmax_8_axis_0 = const()[name = string("softmax_8_axis_0"), val = int32(-1)]; tensor softmax_8_cast_fp16 = softmax(axis = softmax_8_axis_0, x = add_8_cast_fp16)[name = string("softmax_8_cast_fp16")]; bool attn_output_33_transpose_x_0 = const()[name = string("attn_output_33_transpose_x_0"), val = bool(false)]; bool attn_output_33_transpose_y_0 = const()[name = string("attn_output_33_transpose_y_0"), val = bool(false)]; tensor value_17_cast_fp16 = transpose(perm = value_17_perm_0, x = var_561_cast_fp16)[name = string("transpose_85")]; tensor attn_output_33_cast_fp16 = matmul(transpose_x = attn_output_33_transpose_x_0, transpose_y = attn_output_33_transpose_y_0, x = softmax_8_cast_fp16, y = value_17_cast_fp16)[name = string("attn_output_33_cast_fp16")]; tensor var_564_perm_0 = const()[name = string("op_564_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_566 = const()[name = string("op_566"), val = tensor([1, 77, -1])]; tensor var_564_cast_fp16 = transpose(perm = var_564_perm_0, x = attn_output_33_cast_fp16)[name = string("transpose_84")]; tensor var_567_cast_fp16 = reshape(shape = var_566, x = var_564_cast_fp16)[name = string("op_567_cast_fp16")]; tensor encoder_encoder_layers_8_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(73419392))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(73861824))))[name = string("encoder_encoder_layers_8_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_8_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_8_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(73868032)))]; tensor linear_51_cast_fp16 = linear(bias = encoder_encoder_layers_8_self_attn_out_proj_bias_to_fp16, weight = encoder_encoder_layers_8_self_attn_out_proj_weight_to_fp16_palettized, x = var_567_cast_fp16)[name = string("linear_51_cast_fp16")]; tensor input_103_cast_fp16 = add(x = input_99_cast_fp16, y = linear_51_cast_fp16)[name = string("input_103_cast_fp16")]; tensor input_105_axes_0 = const()[name = string("input_105_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_8_layer_norm2_weight_to_fp16 = const()[name = string("encoder_encoder_layers_8_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(73869632)))]; tensor encoder_encoder_layers_8_layer_norm2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_8_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(73871232)))]; tensor input_105_cast_fp16 = layer_norm(axes = input_105_axes_0, beta = encoder_encoder_layers_8_layer_norm2_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_8_layer_norm2_weight_to_fp16, x = input_103_cast_fp16)[name = string("input_105_cast_fp16")]; tensor encoder_encoder_layers_8_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(73872832))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(75642368))))[name = string("encoder_encoder_layers_8_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_8_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_8_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(75667008)))]; tensor linear_52_cast_fp16 = linear(bias = encoder_encoder_layers_8_mlp_fc1_bias_to_fp16, weight = encoder_encoder_layers_8_mlp_fc1_weight_to_fp16_palettized, x = input_105_cast_fp16)[name = string("linear_52_cast_fp16")]; fp16 var_582_to_fp16 = const()[name = string("op_582_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_583_cast_fp16 = mul(x = linear_52_cast_fp16, y = var_582_to_fp16)[name = string("op_583_cast_fp16")]; tensor var_584_cast_fp16 = sigmoid(x = var_583_cast_fp16)[name = string("op_584_cast_fp16")]; tensor input_109_cast_fp16 = mul(x = linear_52_cast_fp16, y = var_584_cast_fp16)[name = string("input_109_cast_fp16")]; tensor encoder_encoder_layers_8_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(75673216))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77442752))))[name = string("encoder_encoder_layers_8_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_8_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_8_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77448960)))]; tensor linear_53_cast_fp16 = linear(bias = encoder_encoder_layers_8_mlp_fc2_bias_to_fp16, weight = encoder_encoder_layers_8_mlp_fc2_weight_to_fp16_palettized, x = input_109_cast_fp16)[name = string("linear_53_cast_fp16")]; tensor input_111_cast_fp16 = add(x = input_103_cast_fp16, y = linear_53_cast_fp16)[name = string("input_111_cast_fp16")]; tensor hidden_states_55_axes_0 = const()[name = string("hidden_states_55_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_9_layer_norm1_weight_to_fp16 = const()[name = string("encoder_encoder_layers_9_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77450560)))]; tensor encoder_encoder_layers_9_layer_norm1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_9_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77452160)))]; tensor hidden_states_55_cast_fp16 = layer_norm(axes = hidden_states_55_axes_0, beta = encoder_encoder_layers_9_layer_norm1_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_9_layer_norm1_weight_to_fp16, x = input_111_cast_fp16)[name = string("hidden_states_55_cast_fp16")]; tensor encoder_encoder_layers_9_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77453760))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77896192))))[name = string("encoder_encoder_layers_9_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_9_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_9_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77902400)))]; tensor linear_54_cast_fp16 = linear(bias = encoder_encoder_layers_9_self_attn_q_proj_bias_to_fp16, weight = encoder_encoder_layers_9_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_55_cast_fp16)[name = string("linear_54_cast_fp16")]; tensor encoder_encoder_layers_9_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77904000))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(78346432))))[name = string("encoder_encoder_layers_9_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_9_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_9_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(78352640)))]; tensor linear_55_cast_fp16 = linear(bias = encoder_encoder_layers_9_self_attn_k_proj_bias_to_fp16, weight = encoder_encoder_layers_9_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_55_cast_fp16)[name = string("linear_55_cast_fp16")]; tensor encoder_encoder_layers_9_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(78354240))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(78796672))))[name = string("encoder_encoder_layers_9_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_9_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_9_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(78802880)))]; tensor linear_56_cast_fp16 = linear(bias = encoder_encoder_layers_9_self_attn_v_proj_bias_to_fp16, weight = encoder_encoder_layers_9_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_55_cast_fp16)[name = string("linear_56_cast_fp16")]; tensor var_613 = const()[name = string("op_613"), val = tensor([1, 77, -1, 64])]; tensor var_614_cast_fp16 = reshape(shape = var_613, x = linear_54_cast_fp16)[name = string("op_614_cast_fp16")]; tensor var_616 = const()[name = string("op_616"), val = tensor([1, 77, -1, 64])]; tensor var_617_cast_fp16 = reshape(shape = var_616, x = linear_55_cast_fp16)[name = string("op_617_cast_fp16")]; tensor var_619 = const()[name = string("op_619"), val = tensor([1, 77, -1, 64])]; tensor var_620_cast_fp16 = reshape(shape = var_619, x = linear_56_cast_fp16)[name = string("op_620_cast_fp16")]; tensor value_19_perm_0 = const()[name = string("value_19_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_19_cast_fp16 = mul(x = var_614_cast_fp16, y = var_9_to_fp16)[name = string("mul_19_cast_fp16")]; bool matmul_9_transpose_y_0 = const()[name = string("matmul_9_transpose_y_0"), val = bool(true)]; bool matmul_9_transpose_x_0 = const()[name = string("matmul_9_transpose_x_0"), val = bool(false)]; tensor transpose_66_perm_0 = const()[name = string("transpose_66_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_67_perm_0 = const()[name = string("transpose_67_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_67 = transpose(perm = transpose_67_perm_0, x = var_617_cast_fp16)[name = string("transpose_82")]; tensor transpose_66 = transpose(perm = transpose_66_perm_0, x = mul_19_cast_fp16)[name = string("transpose_83")]; tensor matmul_9_cast_fp16 = matmul(transpose_x = matmul_9_transpose_x_0, transpose_y = matmul_9_transpose_y_0, x = transpose_66, y = transpose_67)[name = string("matmul_9_cast_fp16")]; tensor add_9_cast_fp16 = add(x = matmul_9_cast_fp16, y = mul_0_to_fp16)[name = string("add_9_cast_fp16")]; int32 softmax_9_axis_0 = const()[name = string("softmax_9_axis_0"), val = int32(-1)]; tensor softmax_9_cast_fp16 = softmax(axis = softmax_9_axis_0, x = add_9_cast_fp16)[name = string("softmax_9_cast_fp16")]; bool attn_output_37_transpose_x_0 = const()[name = string("attn_output_37_transpose_x_0"), val = bool(false)]; bool attn_output_37_transpose_y_0 = const()[name = string("attn_output_37_transpose_y_0"), val = bool(false)]; tensor value_19_cast_fp16 = transpose(perm = value_19_perm_0, x = var_620_cast_fp16)[name = string("transpose_81")]; tensor attn_output_37_cast_fp16 = matmul(transpose_x = attn_output_37_transpose_x_0, transpose_y = attn_output_37_transpose_y_0, x = softmax_9_cast_fp16, y = value_19_cast_fp16)[name = string("attn_output_37_cast_fp16")]; tensor var_623_perm_0 = const()[name = string("op_623_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_625 = const()[name = string("op_625"), val = tensor([1, 77, -1])]; tensor var_623_cast_fp16 = transpose(perm = var_623_perm_0, x = attn_output_37_cast_fp16)[name = string("transpose_80")]; tensor var_626_cast_fp16 = reshape(shape = var_625, x = var_623_cast_fp16)[name = string("op_626_cast_fp16")]; tensor encoder_encoder_layers_9_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(78804480))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(79246912))))[name = string("encoder_encoder_layers_9_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_9_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_9_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(79253120)))]; tensor linear_57_cast_fp16 = linear(bias = encoder_encoder_layers_9_self_attn_out_proj_bias_to_fp16, weight = encoder_encoder_layers_9_self_attn_out_proj_weight_to_fp16_palettized, x = var_626_cast_fp16)[name = string("linear_57_cast_fp16")]; tensor input_115_cast_fp16 = add(x = input_111_cast_fp16, y = linear_57_cast_fp16)[name = string("input_115_cast_fp16")]; tensor input_117_axes_0 = const()[name = string("input_117_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_9_layer_norm2_weight_to_fp16 = const()[name = string("encoder_encoder_layers_9_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(79254720)))]; tensor encoder_encoder_layers_9_layer_norm2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_9_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(79256320)))]; tensor input_117_cast_fp16 = layer_norm(axes = input_117_axes_0, beta = encoder_encoder_layers_9_layer_norm2_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_9_layer_norm2_weight_to_fp16, x = input_115_cast_fp16)[name = string("input_117_cast_fp16")]; tensor encoder_encoder_layers_9_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(79257920))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(81027456))))[name = string("encoder_encoder_layers_9_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_9_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_9_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(81052096)))]; tensor linear_58_cast_fp16 = linear(bias = encoder_encoder_layers_9_mlp_fc1_bias_to_fp16, weight = encoder_encoder_layers_9_mlp_fc1_weight_to_fp16_palettized, x = input_117_cast_fp16)[name = string("linear_58_cast_fp16")]; fp16 var_641_to_fp16 = const()[name = string("op_641_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_642_cast_fp16 = mul(x = linear_58_cast_fp16, y = var_641_to_fp16)[name = string("op_642_cast_fp16")]; tensor var_643_cast_fp16 = sigmoid(x = var_642_cast_fp16)[name = string("op_643_cast_fp16")]; tensor input_121_cast_fp16 = mul(x = linear_58_cast_fp16, y = var_643_cast_fp16)[name = string("input_121_cast_fp16")]; tensor encoder_encoder_layers_9_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(81058304))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(82827840))))[name = string("encoder_encoder_layers_9_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_9_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_9_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(82834048)))]; tensor linear_59_cast_fp16 = linear(bias = encoder_encoder_layers_9_mlp_fc2_bias_to_fp16, weight = encoder_encoder_layers_9_mlp_fc2_weight_to_fp16_palettized, x = input_121_cast_fp16)[name = string("linear_59_cast_fp16")]; tensor input_123_cast_fp16 = add(x = input_115_cast_fp16, y = linear_59_cast_fp16)[name = string("input_123_cast_fp16")]; tensor hidden_states_61_axes_0 = const()[name = string("hidden_states_61_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_10_layer_norm1_weight_to_fp16 = const()[name = string("encoder_encoder_layers_10_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(82835648)))]; tensor encoder_encoder_layers_10_layer_norm1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_10_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(82837248)))]; tensor hidden_states_61_cast_fp16 = layer_norm(axes = hidden_states_61_axes_0, beta = encoder_encoder_layers_10_layer_norm1_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_10_layer_norm1_weight_to_fp16, x = input_123_cast_fp16)[name = string("hidden_states_61_cast_fp16")]; tensor encoder_encoder_layers_10_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(82838848))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(83281280))))[name = string("encoder_encoder_layers_10_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_10_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_10_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(83287488)))]; tensor linear_60_cast_fp16 = linear(bias = encoder_encoder_layers_10_self_attn_q_proj_bias_to_fp16, weight = encoder_encoder_layers_10_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_61_cast_fp16)[name = string("linear_60_cast_fp16")]; tensor encoder_encoder_layers_10_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(83289088))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(83731520))))[name = string("encoder_encoder_layers_10_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_10_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_10_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(83737728)))]; tensor linear_61_cast_fp16 = linear(bias = encoder_encoder_layers_10_self_attn_k_proj_bias_to_fp16, weight = encoder_encoder_layers_10_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_61_cast_fp16)[name = string("linear_61_cast_fp16")]; tensor encoder_encoder_layers_10_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(83739328))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(84181760))))[name = string("encoder_encoder_layers_10_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_10_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_10_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(84187968)))]; tensor linear_62_cast_fp16 = linear(bias = encoder_encoder_layers_10_self_attn_v_proj_bias_to_fp16, weight = encoder_encoder_layers_10_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_61_cast_fp16)[name = string("linear_62_cast_fp16")]; tensor var_672 = const()[name = string("op_672"), val = tensor([1, 77, -1, 64])]; tensor var_673_cast_fp16 = reshape(shape = var_672, x = linear_60_cast_fp16)[name = string("op_673_cast_fp16")]; tensor var_675 = const()[name = string("op_675"), val = tensor([1, 77, -1, 64])]; tensor var_676_cast_fp16 = reshape(shape = var_675, x = linear_61_cast_fp16)[name = string("op_676_cast_fp16")]; tensor var_678 = const()[name = string("op_678"), val = tensor([1, 77, -1, 64])]; tensor var_679_cast_fp16 = reshape(shape = var_678, x = linear_62_cast_fp16)[name = string("op_679_cast_fp16")]; tensor value_21_perm_0 = const()[name = string("value_21_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_21_cast_fp16 = mul(x = var_673_cast_fp16, y = var_9_to_fp16)[name = string("mul_21_cast_fp16")]; bool matmul_10_transpose_y_0 = const()[name = string("matmul_10_transpose_y_0"), val = bool(true)]; bool matmul_10_transpose_x_0 = const()[name = string("matmul_10_transpose_x_0"), val = bool(false)]; tensor transpose_68_perm_0 = const()[name = string("transpose_68_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_69_perm_0 = const()[name = string("transpose_69_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_69 = transpose(perm = transpose_69_perm_0, x = var_676_cast_fp16)[name = string("transpose_78")]; tensor transpose_68 = transpose(perm = transpose_68_perm_0, x = mul_21_cast_fp16)[name = string("transpose_79")]; tensor matmul_10_cast_fp16 = matmul(transpose_x = matmul_10_transpose_x_0, transpose_y = matmul_10_transpose_y_0, x = transpose_68, y = transpose_69)[name = string("matmul_10_cast_fp16")]; tensor add_10_cast_fp16 = add(x = matmul_10_cast_fp16, y = mul_0_to_fp16)[name = string("add_10_cast_fp16")]; int32 softmax_10_axis_0 = const()[name = string("softmax_10_axis_0"), val = int32(-1)]; tensor softmax_10_cast_fp16 = softmax(axis = softmax_10_axis_0, x = add_10_cast_fp16)[name = string("softmax_10_cast_fp16")]; bool attn_output_41_transpose_x_0 = const()[name = string("attn_output_41_transpose_x_0"), val = bool(false)]; bool attn_output_41_transpose_y_0 = const()[name = string("attn_output_41_transpose_y_0"), val = bool(false)]; tensor value_21_cast_fp16 = transpose(perm = value_21_perm_0, x = var_679_cast_fp16)[name = string("transpose_77")]; tensor attn_output_41_cast_fp16 = matmul(transpose_x = attn_output_41_transpose_x_0, transpose_y = attn_output_41_transpose_y_0, x = softmax_10_cast_fp16, y = value_21_cast_fp16)[name = string("attn_output_41_cast_fp16")]; tensor var_682_perm_0 = const()[name = string("op_682_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_684 = const()[name = string("op_684"), val = tensor([1, 77, -1])]; tensor var_682_cast_fp16 = transpose(perm = var_682_perm_0, x = attn_output_41_cast_fp16)[name = string("transpose_76")]; tensor var_685_cast_fp16 = reshape(shape = var_684, x = var_682_cast_fp16)[name = string("op_685_cast_fp16")]; tensor encoder_encoder_layers_10_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(84189568))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(84632000))))[name = string("encoder_encoder_layers_10_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_10_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_10_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(84638208)))]; tensor linear_63_cast_fp16 = linear(bias = encoder_encoder_layers_10_self_attn_out_proj_bias_to_fp16, weight = encoder_encoder_layers_10_self_attn_out_proj_weight_to_fp16_palettized, x = var_685_cast_fp16)[name = string("linear_63_cast_fp16")]; tensor input_127_cast_fp16 = add(x = input_123_cast_fp16, y = linear_63_cast_fp16)[name = string("input_127_cast_fp16")]; tensor input_129_axes_0 = const()[name = string("input_129_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_10_layer_norm2_weight_to_fp16 = const()[name = string("encoder_encoder_layers_10_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(84639808)))]; tensor encoder_encoder_layers_10_layer_norm2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_10_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(84641408)))]; tensor input_129_cast_fp16 = layer_norm(axes = input_129_axes_0, beta = encoder_encoder_layers_10_layer_norm2_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_10_layer_norm2_weight_to_fp16, x = input_127_cast_fp16)[name = string("input_129_cast_fp16")]; tensor encoder_encoder_layers_10_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(84643008))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(86412544))))[name = string("encoder_encoder_layers_10_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_10_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_10_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(86437184)))]; tensor linear_64_cast_fp16 = linear(bias = encoder_encoder_layers_10_mlp_fc1_bias_to_fp16, weight = encoder_encoder_layers_10_mlp_fc1_weight_to_fp16_palettized, x = input_129_cast_fp16)[name = string("linear_64_cast_fp16")]; fp16 var_700_to_fp16 = const()[name = string("op_700_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_701_cast_fp16 = mul(x = linear_64_cast_fp16, y = var_700_to_fp16)[name = string("op_701_cast_fp16")]; tensor var_702_cast_fp16 = sigmoid(x = var_701_cast_fp16)[name = string("op_702_cast_fp16")]; tensor input_133_cast_fp16 = mul(x = linear_64_cast_fp16, y = var_702_cast_fp16)[name = string("input_133_cast_fp16")]; tensor encoder_encoder_layers_10_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(86443392))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(88212928))))[name = string("encoder_encoder_layers_10_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_10_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_10_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(88219136)))]; tensor linear_65_cast_fp16 = linear(bias = encoder_encoder_layers_10_mlp_fc2_bias_to_fp16, weight = encoder_encoder_layers_10_mlp_fc2_weight_to_fp16_palettized, x = input_133_cast_fp16)[name = string("linear_65_cast_fp16")]; tensor input_135_cast_fp16 = add(x = input_127_cast_fp16, y = linear_65_cast_fp16)[name = string("input_135_cast_fp16")]; tensor hidden_states_67_axes_0 = const()[name = string("hidden_states_67_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_11_layer_norm1_weight_to_fp16 = const()[name = string("encoder_encoder_layers_11_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(88220736)))]; tensor encoder_encoder_layers_11_layer_norm1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_11_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(88222336)))]; tensor hidden_states_67_cast_fp16 = layer_norm(axes = hidden_states_67_axes_0, beta = encoder_encoder_layers_11_layer_norm1_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_11_layer_norm1_weight_to_fp16, x = input_135_cast_fp16)[name = string("hidden_states_67_cast_fp16")]; tensor encoder_encoder_layers_11_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(88223936))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(88666368))))[name = string("encoder_encoder_layers_11_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_11_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_11_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(88672576)))]; tensor linear_66_cast_fp16 = linear(bias = encoder_encoder_layers_11_self_attn_q_proj_bias_to_fp16, weight = encoder_encoder_layers_11_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_67_cast_fp16)[name = string("linear_66_cast_fp16")]; tensor encoder_encoder_layers_11_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(88674176))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(89116608))))[name = string("encoder_encoder_layers_11_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_11_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_11_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(89122816)))]; tensor linear_67_cast_fp16 = linear(bias = encoder_encoder_layers_11_self_attn_k_proj_bias_to_fp16, weight = encoder_encoder_layers_11_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_67_cast_fp16)[name = string("linear_67_cast_fp16")]; tensor encoder_encoder_layers_11_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(89124416))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(89566848))))[name = string("encoder_encoder_layers_11_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_11_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_11_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(89573056)))]; tensor linear_68_cast_fp16 = linear(bias = encoder_encoder_layers_11_self_attn_v_proj_bias_to_fp16, weight = encoder_encoder_layers_11_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_67_cast_fp16)[name = string("linear_68_cast_fp16")]; tensor var_731 = const()[name = string("op_731"), val = tensor([1, 77, -1, 64])]; tensor var_732_cast_fp16 = reshape(shape = var_731, x = linear_66_cast_fp16)[name = string("op_732_cast_fp16")]; tensor var_734 = const()[name = string("op_734"), val = tensor([1, 77, -1, 64])]; tensor var_735_cast_fp16 = reshape(shape = var_734, x = linear_67_cast_fp16)[name = string("op_735_cast_fp16")]; tensor var_737 = const()[name = string("op_737"), val = tensor([1, 77, -1, 64])]; tensor var_738_cast_fp16 = reshape(shape = var_737, x = linear_68_cast_fp16)[name = string("op_738_cast_fp16")]; tensor value_perm_0 = const()[name = string("value_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_23_cast_fp16 = mul(x = var_732_cast_fp16, y = var_9_to_fp16)[name = string("mul_23_cast_fp16")]; bool matmul_11_transpose_y_0 = const()[name = string("matmul_11_transpose_y_0"), val = bool(true)]; bool matmul_11_transpose_x_0 = const()[name = string("matmul_11_transpose_x_0"), val = bool(false)]; tensor transpose_70_perm_0 = const()[name = string("transpose_70_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_71_perm_0 = const()[name = string("transpose_71_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_71 = transpose(perm = transpose_71_perm_0, x = var_735_cast_fp16)[name = string("transpose_74")]; tensor transpose_70 = transpose(perm = transpose_70_perm_0, x = mul_23_cast_fp16)[name = string("transpose_75")]; tensor matmul_11_cast_fp16 = matmul(transpose_x = matmul_11_transpose_x_0, transpose_y = matmul_11_transpose_y_0, x = transpose_70, y = transpose_71)[name = string("matmul_11_cast_fp16")]; tensor add_11_cast_fp16 = add(x = matmul_11_cast_fp16, y = mul_0_to_fp16)[name = string("add_11_cast_fp16")]; int32 softmax_11_axis_0 = const()[name = string("softmax_11_axis_0"), val = int32(-1)]; tensor softmax_11_cast_fp16 = softmax(axis = softmax_11_axis_0, x = add_11_cast_fp16)[name = string("softmax_11_cast_fp16")]; bool attn_output_45_transpose_x_0 = const()[name = string("attn_output_45_transpose_x_0"), val = bool(false)]; bool attn_output_45_transpose_y_0 = const()[name = string("attn_output_45_transpose_y_0"), val = bool(false)]; tensor value_cast_fp16 = transpose(perm = value_perm_0, x = var_738_cast_fp16)[name = string("transpose_73")]; tensor attn_output_45_cast_fp16 = matmul(transpose_x = attn_output_45_transpose_x_0, transpose_y = attn_output_45_transpose_y_0, x = softmax_11_cast_fp16, y = value_cast_fp16)[name = string("attn_output_45_cast_fp16")]; tensor var_741_perm_0 = const()[name = string("op_741_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_743 = const()[name = string("op_743"), val = tensor([1, 77, -1])]; tensor var_741_cast_fp16 = transpose(perm = var_741_perm_0, x = attn_output_45_cast_fp16)[name = string("transpose_72")]; tensor var_744_cast_fp16 = reshape(shape = var_743, x = var_741_cast_fp16)[name = string("op_744_cast_fp16")]; tensor encoder_encoder_layers_11_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(89574656))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(90017088))))[name = string("encoder_encoder_layers_11_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_11_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_encoder_layers_11_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(90023296)))]; tensor linear_69_cast_fp16 = linear(bias = encoder_encoder_layers_11_self_attn_out_proj_bias_to_fp16, weight = encoder_encoder_layers_11_self_attn_out_proj_weight_to_fp16_palettized, x = var_744_cast_fp16)[name = string("linear_69_cast_fp16")]; tensor input_139_cast_fp16 = add(x = input_135_cast_fp16, y = linear_69_cast_fp16)[name = string("input_139_cast_fp16")]; tensor input_141_axes_0 = const()[name = string("input_141_axes_0"), val = tensor([-1])]; tensor encoder_encoder_layers_11_layer_norm2_weight_to_fp16 = const()[name = string("encoder_encoder_layers_11_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(90024896)))]; tensor encoder_encoder_layers_11_layer_norm2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_11_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(90026496)))]; tensor input_141_cast_fp16 = layer_norm(axes = input_141_axes_0, beta = encoder_encoder_layers_11_layer_norm2_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_encoder_layers_11_layer_norm2_weight_to_fp16, x = input_139_cast_fp16)[name = string("input_141_cast_fp16")]; tensor encoder_encoder_layers_11_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(90028096))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(91797632))))[name = string("encoder_encoder_layers_11_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_11_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_encoder_layers_11_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(91822272)))]; tensor linear_70_cast_fp16 = linear(bias = encoder_encoder_layers_11_mlp_fc1_bias_to_fp16, weight = encoder_encoder_layers_11_mlp_fc1_weight_to_fp16_palettized, x = input_141_cast_fp16)[name = string("linear_70_cast_fp16")]; fp16 var_759_to_fp16 = const()[name = string("op_759_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_760_cast_fp16 = mul(x = linear_70_cast_fp16, y = var_759_to_fp16)[name = string("op_760_cast_fp16")]; tensor var_761_cast_fp16 = sigmoid(x = var_760_cast_fp16)[name = string("op_761_cast_fp16")]; tensor input_145_cast_fp16 = mul(x = linear_70_cast_fp16, y = var_761_cast_fp16)[name = string("input_145_cast_fp16")]; tensor encoder_encoder_layers_11_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(91828480))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(93598016))))[name = string("encoder_encoder_layers_11_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_encoder_layers_11_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_encoder_layers_11_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(93604224)))]; tensor linear_71_cast_fp16 = linear(bias = encoder_encoder_layers_11_mlp_fc2_bias_to_fp16, weight = encoder_encoder_layers_11_mlp_fc2_weight_to_fp16_palettized, x = input_145_cast_fp16)[name = string("linear_71_cast_fp16")]; tensor input_cast_fp16 = add(x = input_139_cast_fp16, y = linear_71_cast_fp16)[name = string("input_cast_fp16")]; tensor last_hidden_state_axes_0 = const()[name = string("last_hidden_state_axes_0"), val = tensor([-1])]; tensor encoder_final_layer_norm_weight_to_fp16 = const()[name = string("encoder_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(93605824)))]; tensor encoder_final_layer_norm_bias_to_fp16 = const()[name = string("encoder_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(93607424)))]; tensor hidden_embeds = layer_norm(axes = last_hidden_state_axes_0, beta = encoder_final_layer_norm_bias_to_fp16, epsilon = var_11_to_fp16, gamma = encoder_final_layer_norm_weight_to_fp16, x = input_cast_fp16)[name = string("last_hidden_state_cast_fp16")]; tensor var_772 = const()[name = string("op_772"), val = tensor([0])]; int32 var_774_axis_0 = const()[name = string("op_774_axis_0"), val = int32(-1)]; bool var_774_keep_dims_0 = const()[name = string("op_774_keep_dims_0"), val = bool(false)]; string var_774_output_dtype_0 = const()[name = string("op_774_output_dtype_0"), val = string("int32")]; tensor var_774 = reduce_argmax(axis = var_774_axis_0, keep_dims = var_774_keep_dims_0, output_dtype = var_774_output_dtype_0, x = input_ids)[name = string("op_774")]; int32 stack_0_axis_0 = const()[name = string("stack_0_axis_0"), val = int32(1)]; tensor stack_0 = stack(axis = stack_0_axis_0, values = (var_772, var_774))[name = string("stack_0")]; int32 var_776_transpose_batch_dims_0 = const()[name = string("op_776_transpose_batch_dims_0"), val = int32(0)]; bool var_776_transpose_validate_indices_0 = const()[name = string("op_776_transpose_validate_indices_0"), val = bool(false)]; string stack_0_to_uint16_dtype_0 = const()[name = string("stack_0_to_uint16_dtype_0"), val = string("uint16")]; tensor stack_0_to_uint16 = cast(dtype = stack_0_to_uint16_dtype_0, x = stack_0)[name = string("cast_0")]; tensor pooled_outputs = gather_nd(batch_dims = var_776_transpose_batch_dims_0, indices = stack_0_to_uint16, validate_indices = var_776_transpose_validate_indices_0, x = hidden_embeds)[name = string("op_776_transpose_cast_fp16_cast_uint16")]; } -> (hidden_embeds, pooled_outputs); }