program(1.3) [buildInfo = dict({{"coremlc-component-MIL", "3520.4.1"}, {"coremlc-version", "3520.5.1"}})] { func main(tensor input_ids) { int32 inputs_embeds_batch_dims_0 = const()[name = string("inputs_embeds_batch_dims_0"), val = int32(0)]; bool inputs_embeds_validate_indices_0 = const()[name = string("inputs_embeds_validate_indices_0"), val = bool(false)]; tensor encoder_text_model_embeddings_token_embedding_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(47431808))))[name = string("encoder_text_model_embeddings_token_embedding_weight_to_fp16_palettized")]; int32 greater_equal_0_y_0 = const()[name = string("greater_equal_0_y_0"), val = int32(0)]; tensor greater_equal_0 = greater_equal(x = input_ids, y = greater_equal_0_y_0)[name = string("greater_equal_0")]; int32 slice_by_index_0 = const()[name = string("slice_by_index_0"), val = int32(49408)]; tensor add_32 = add(x = input_ids, y = slice_by_index_0)[name = string("add_32")]; tensor select_0 = select(a = input_ids, b = add_32, cond = greater_equal_0)[name = string("select_0")]; int32 greater_equal_0_y_0_1 = const()[name = string("greater_equal_0_y_0_1"), val = int32(0)]; tensor greater_equal_0_1 = greater_equal(x = select_0, y = greater_equal_0_y_0_1)[name = string("greater_equal_0_1")]; int32 slice_by_index_0_1 = const()[name = string("slice_by_index_0_1"), val = int32(49408)]; tensor add_0 = add(x = select_0, y = slice_by_index_0_1)[name = string("add_0")]; tensor select_0_1 = select(a = select_0, b = add_0, cond = greater_equal_0_1)[name = string("select_0_1")]; int32 inputs_embeds_cast_fp16_axis_0 = const()[name = string("inputs_embeds_cast_fp16_axis_0"), val = int32(0)]; tensor inputs_embeds_cast_fp16 = gather(axis = inputs_embeds_cast_fp16_axis_0, batch_dims = inputs_embeds_batch_dims_0, indices = select_0_1, validate_indices = inputs_embeds_validate_indices_0, x = encoder_text_model_embeddings_token_embedding_weight_to_fp16_palettized)[name = string("inputs_embeds_cast_fp16")]; tensor position_embeddings_to_fp16 = const()[name = string("position_embeddings_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(47827136)))]; tensor input_3_cast_fp16 = add(x = inputs_embeds_cast_fp16, y = position_embeddings_to_fp16)[name = string("input_3_cast_fp16")]; tensor hidden_states_1_axes_0 = const()[name = string("hidden_states_1_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_0_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_0_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(48024320)))]; tensor encoder_text_model_encoder_layers_0_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_0_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(48026944)))]; fp16 var_9_to_fp16 = const()[name = string("op_9_to_fp16"), val = fp16(0x1.5p-17)]; tensor hidden_states_1_cast_fp16 = layer_norm(axes = hidden_states_1_axes_0, beta = encoder_text_model_encoder_layers_0_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_0_layer_norm1_weight_to_fp16, x = input_3_cast_fp16)[name = string("hidden_states_1_cast_fp16")]; tensor encoder_text_model_encoder_layers_0_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(48029568))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(49258432))))[name = string("encoder_text_model_encoder_layers_0_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_0_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_0_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(49268736)))]; tensor linear_0_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_0_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_0_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_1_cast_fp16)[name = string("linear_0_cast_fp16")]; tensor encoder_text_model_encoder_layers_0_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(49271360))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(50500224))))[name = string("encoder_text_model_encoder_layers_0_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_0_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_0_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(50510528)))]; tensor linear_1_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_0_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_0_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_1_cast_fp16)[name = string("linear_1_cast_fp16")]; tensor encoder_text_model_encoder_layers_0_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(50513152))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(51742016))))[name = string("encoder_text_model_encoder_layers_0_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_0_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_0_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(51752320)))]; tensor linear_2_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_0_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_0_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_1_cast_fp16)[name = string("linear_2_cast_fp16")]; tensor var_125 = const()[name = string("op_125"), val = tensor([1, 77, -1, 64])]; tensor var_126_cast_fp16 = reshape(shape = var_125, x = linear_0_cast_fp16)[name = string("op_126_cast_fp16")]; tensor var_128 = const()[name = string("op_128"), val = tensor([1, 77, -1, 64])]; tensor var_129_cast_fp16 = reshape(shape = var_128, x = linear_1_cast_fp16)[name = string("op_129_cast_fp16")]; tensor var_131 = const()[name = string("op_131"), val = tensor([1, 77, -1, 64])]; tensor var_132_cast_fp16 = reshape(shape = var_131, x = linear_2_cast_fp16)[name = string("op_132_cast_fp16")]; tensor value_1_perm_0 = const()[name = string("value_1_perm_0"), val = tensor([0, 2, -3, -1])]; fp16 var_11_to_fp16 = const()[name = string("op_11_to_fp16"), val = fp16(0x1p-3)]; tensor mul_1_cast_fp16 = mul(x = var_126_cast_fp16, y = var_11_to_fp16)[name = string("mul_1_cast_fp16")]; bool matmul_0_transpose_y_0 = const()[name = string("matmul_0_transpose_y_0"), val = bool(true)]; bool matmul_0_transpose_x_0 = const()[name = string("matmul_0_transpose_x_0"), val = bool(false)]; tensor transpose_128_perm_0 = const()[name = string("transpose_128_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_129_perm_0 = const()[name = string("transpose_129_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_129 = transpose(perm = transpose_129_perm_0, x = var_129_cast_fp16)[name = string("transpose_318")]; tensor transpose_128 = transpose(perm = transpose_128_perm_0, x = mul_1_cast_fp16)[name = string("transpose_319")]; tensor matmul_0_cast_fp16 = matmul(transpose_x = matmul_0_transpose_x_0, transpose_y = matmul_0_transpose_y_0, x = transpose_128, y = transpose_129)[name = string("matmul_0_cast_fp16")]; tensor mul_0_to_fp16 = const()[name = string("mul_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(51754944)))]; tensor add_0_cast_fp16 = add(x = matmul_0_cast_fp16, y = mul_0_to_fp16)[name = string("add_0_cast_fp16")]; int32 softmax_0_axis_0 = const()[name = string("softmax_0_axis_0"), val = int32(-1)]; tensor softmax_0_cast_fp16 = softmax(axis = softmax_0_axis_0, x = add_0_cast_fp16)[name = string("softmax_0_cast_fp16")]; bool attn_output_1_transpose_x_0 = const()[name = string("attn_output_1_transpose_x_0"), val = bool(false)]; bool attn_output_1_transpose_y_0 = const()[name = string("attn_output_1_transpose_y_0"), val = bool(false)]; tensor value_1_cast_fp16 = transpose(perm = value_1_perm_0, x = var_132_cast_fp16)[name = string("transpose_317")]; tensor attn_output_1_cast_fp16 = matmul(transpose_x = attn_output_1_transpose_x_0, transpose_y = attn_output_1_transpose_y_0, x = softmax_0_cast_fp16, y = value_1_cast_fp16)[name = string("attn_output_1_cast_fp16")]; tensor var_135_perm_0 = const()[name = string("op_135_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_137 = const()[name = string("op_137"), val = tensor([1, 77, -1])]; tensor var_135_cast_fp16 = transpose(perm = var_135_perm_0, x = attn_output_1_cast_fp16)[name = string("transpose_316")]; tensor var_138_cast_fp16 = reshape(shape = var_137, x = var_135_cast_fp16)[name = string("op_138_cast_fp16")]; tensor encoder_text_model_encoder_layers_0_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(51766912))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(52995776))))[name = string("encoder_text_model_encoder_layers_0_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_0_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_0_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(53006080)))]; tensor linear_3_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_0_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_0_self_attn_out_proj_weight_to_fp16_palettized, x = var_138_cast_fp16)[name = string("linear_3_cast_fp16")]; tensor input_7_cast_fp16 = add(x = input_3_cast_fp16, y = linear_3_cast_fp16)[name = string("input_7_cast_fp16")]; tensor input_9_axes_0 = const()[name = string("input_9_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_0_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_0_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(53008704)))]; tensor encoder_text_model_encoder_layers_0_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_0_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(53011328)))]; tensor input_9_cast_fp16 = layer_norm(axes = input_9_axes_0, beta = encoder_text_model_encoder_layers_0_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_0_layer_norm2_weight_to_fp16, x = input_7_cast_fp16)[name = string("input_9_cast_fp16")]; tensor encoder_text_model_encoder_layers_0_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(53013952))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(57929216))))[name = string("encoder_text_model_encoder_layers_0_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_0_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_0_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(57970240)))]; tensor linear_4_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_0_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_0_mlp_fc1_weight_to_fp16_palettized, x = input_9_cast_fp16)[name = string("linear_4_cast_fp16")]; string input_13_mode_0 = const()[name = string("input_13_mode_0"), val = string("EXACT")]; tensor input_13_cast_fp16 = gelu(mode = input_13_mode_0, x = linear_4_cast_fp16)[name = string("input_13_cast_fp16")]; tensor encoder_text_model_encoder_layers_0_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(57980544))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(62895808))))[name = string("encoder_text_model_encoder_layers_0_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_0_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_0_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(62906112)))]; tensor linear_5_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_0_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_0_mlp_fc2_weight_to_fp16_palettized, x = input_13_cast_fp16)[name = string("linear_5_cast_fp16")]; tensor input_15_cast_fp16 = add(x = input_7_cast_fp16, y = linear_5_cast_fp16)[name = string("input_15_cast_fp16")]; tensor hidden_states_7_axes_0 = const()[name = string("hidden_states_7_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_1_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_1_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(62908736)))]; tensor encoder_text_model_encoder_layers_1_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_1_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(62911360)))]; tensor hidden_states_7_cast_fp16 = layer_norm(axes = hidden_states_7_axes_0, beta = encoder_text_model_encoder_layers_1_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_1_layer_norm1_weight_to_fp16, x = input_15_cast_fp16)[name = string("hidden_states_7_cast_fp16")]; tensor encoder_text_model_encoder_layers_1_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(62913984))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64142848))))[name = string("encoder_text_model_encoder_layers_1_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_1_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_1_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64153152)))]; tensor linear_6_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_1_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_1_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_7_cast_fp16)[name = string("linear_6_cast_fp16")]; tensor encoder_text_model_encoder_layers_1_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64155776))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(65384640))))[name = string("encoder_text_model_encoder_layers_1_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_1_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_1_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(65394944)))]; tensor linear_7_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_1_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_1_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_7_cast_fp16)[name = string("linear_7_cast_fp16")]; tensor encoder_text_model_encoder_layers_1_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(65397568))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(66626432))))[name = string("encoder_text_model_encoder_layers_1_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_1_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_1_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(66636736)))]; tensor linear_8_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_1_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_1_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_7_cast_fp16)[name = string("linear_8_cast_fp16")]; tensor var_181 = const()[name = string("op_181"), val = tensor([1, 77, -1, 64])]; tensor var_182_cast_fp16 = reshape(shape = var_181, x = linear_6_cast_fp16)[name = string("op_182_cast_fp16")]; tensor var_184 = const()[name = string("op_184"), val = tensor([1, 77, -1, 64])]; tensor var_185_cast_fp16 = reshape(shape = var_184, x = linear_7_cast_fp16)[name = string("op_185_cast_fp16")]; tensor var_187 = const()[name = string("op_187"), val = tensor([1, 77, -1, 64])]; tensor var_188_cast_fp16 = reshape(shape = var_187, x = linear_8_cast_fp16)[name = string("op_188_cast_fp16")]; tensor value_3_perm_0 = const()[name = string("value_3_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_3_cast_fp16 = mul(x = var_182_cast_fp16, y = var_11_to_fp16)[name = string("mul_3_cast_fp16")]; bool matmul_1_transpose_y_0 = const()[name = string("matmul_1_transpose_y_0"), val = bool(true)]; bool matmul_1_transpose_x_0 = const()[name = string("matmul_1_transpose_x_0"), val = bool(false)]; tensor transpose_130_perm_0 = const()[name = string("transpose_130_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_131_perm_0 = const()[name = string("transpose_131_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_131 = transpose(perm = transpose_131_perm_0, x = var_185_cast_fp16)[name = string("transpose_314")]; tensor transpose_130 = transpose(perm = transpose_130_perm_0, x = mul_3_cast_fp16)[name = string("transpose_315")]; tensor matmul_1_cast_fp16 = matmul(transpose_x = matmul_1_transpose_x_0, transpose_y = matmul_1_transpose_y_0, x = transpose_130, y = transpose_131)[name = string("matmul_1_cast_fp16")]; tensor add_1_cast_fp16 = add(x = matmul_1_cast_fp16, y = mul_0_to_fp16)[name = string("add_1_cast_fp16")]; int32 softmax_1_axis_0 = const()[name = string("softmax_1_axis_0"), val = int32(-1)]; tensor softmax_1_cast_fp16 = softmax(axis = softmax_1_axis_0, x = add_1_cast_fp16)[name = string("softmax_1_cast_fp16")]; bool attn_output_5_transpose_x_0 = const()[name = string("attn_output_5_transpose_x_0"), val = bool(false)]; bool attn_output_5_transpose_y_0 = const()[name = string("attn_output_5_transpose_y_0"), val = bool(false)]; tensor value_3_cast_fp16 = transpose(perm = value_3_perm_0, x = var_188_cast_fp16)[name = string("transpose_313")]; tensor attn_output_5_cast_fp16 = matmul(transpose_x = attn_output_5_transpose_x_0, transpose_y = attn_output_5_transpose_y_0, x = softmax_1_cast_fp16, y = value_3_cast_fp16)[name = string("attn_output_5_cast_fp16")]; tensor var_191_perm_0 = const()[name = string("op_191_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_193 = const()[name = string("op_193"), val = tensor([1, 77, -1])]; tensor var_191_cast_fp16 = transpose(perm = var_191_perm_0, x = attn_output_5_cast_fp16)[name = string("transpose_312")]; tensor var_194_cast_fp16 = reshape(shape = var_193, x = var_191_cast_fp16)[name = string("op_194_cast_fp16")]; tensor encoder_text_model_encoder_layers_1_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(66639360))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(67868224))))[name = string("encoder_text_model_encoder_layers_1_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_1_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_1_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(67878528)))]; tensor linear_9_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_1_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_1_self_attn_out_proj_weight_to_fp16_palettized, x = var_194_cast_fp16)[name = string("linear_9_cast_fp16")]; tensor input_19_cast_fp16 = add(x = input_15_cast_fp16, y = linear_9_cast_fp16)[name = string("input_19_cast_fp16")]; tensor input_21_axes_0 = const()[name = string("input_21_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_1_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_1_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(67881152)))]; tensor encoder_text_model_encoder_layers_1_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_1_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(67883776)))]; tensor input_21_cast_fp16 = layer_norm(axes = input_21_axes_0, beta = encoder_text_model_encoder_layers_1_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_1_layer_norm2_weight_to_fp16, x = input_19_cast_fp16)[name = string("input_21_cast_fp16")]; tensor encoder_text_model_encoder_layers_1_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(67886400))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72801664))))[name = string("encoder_text_model_encoder_layers_1_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_1_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_1_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72842688)))]; tensor linear_10_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_1_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_1_mlp_fc1_weight_to_fp16_palettized, x = input_21_cast_fp16)[name = string("linear_10_cast_fp16")]; string input_25_mode_0 = const()[name = string("input_25_mode_0"), val = string("EXACT")]; tensor input_25_cast_fp16 = gelu(mode = input_25_mode_0, x = linear_10_cast_fp16)[name = string("input_25_cast_fp16")]; tensor encoder_text_model_encoder_layers_1_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(72852992))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77768256))))[name = string("encoder_text_model_encoder_layers_1_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_1_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_1_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77778560)))]; tensor linear_11_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_1_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_1_mlp_fc2_weight_to_fp16_palettized, x = input_25_cast_fp16)[name = string("linear_11_cast_fp16")]; tensor input_27_cast_fp16 = add(x = input_19_cast_fp16, y = linear_11_cast_fp16)[name = string("input_27_cast_fp16")]; tensor hidden_states_13_axes_0 = const()[name = string("hidden_states_13_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_2_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_2_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77781184)))]; tensor encoder_text_model_encoder_layers_2_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_2_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77783808)))]; tensor hidden_states_13_cast_fp16 = layer_norm(axes = hidden_states_13_axes_0, beta = encoder_text_model_encoder_layers_2_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_2_layer_norm1_weight_to_fp16, x = input_27_cast_fp16)[name = string("hidden_states_13_cast_fp16")]; tensor encoder_text_model_encoder_layers_2_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77786432))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(79015296))))[name = string("encoder_text_model_encoder_layers_2_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_2_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_2_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(79025600)))]; tensor linear_12_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_2_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_2_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_13_cast_fp16)[name = string("linear_12_cast_fp16")]; tensor encoder_text_model_encoder_layers_2_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(79028224))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(80257088))))[name = string("encoder_text_model_encoder_layers_2_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_2_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_2_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(80267392)))]; tensor linear_13_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_2_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_2_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_13_cast_fp16)[name = string("linear_13_cast_fp16")]; tensor encoder_text_model_encoder_layers_2_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(80270016))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(81498880))))[name = string("encoder_text_model_encoder_layers_2_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_2_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_2_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(81509184)))]; tensor linear_14_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_2_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_2_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_13_cast_fp16)[name = string("linear_14_cast_fp16")]; tensor var_237 = const()[name = string("op_237"), val = tensor([1, 77, -1, 64])]; tensor var_238_cast_fp16 = reshape(shape = var_237, x = linear_12_cast_fp16)[name = string("op_238_cast_fp16")]; tensor var_240 = const()[name = string("op_240"), val = tensor([1, 77, -1, 64])]; tensor var_241_cast_fp16 = reshape(shape = var_240, x = linear_13_cast_fp16)[name = string("op_241_cast_fp16")]; tensor var_243 = const()[name = string("op_243"), val = tensor([1, 77, -1, 64])]; tensor var_244_cast_fp16 = reshape(shape = var_243, x = linear_14_cast_fp16)[name = string("op_244_cast_fp16")]; tensor value_5_perm_0 = const()[name = string("value_5_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_5_cast_fp16 = mul(x = var_238_cast_fp16, y = var_11_to_fp16)[name = string("mul_5_cast_fp16")]; bool matmul_2_transpose_y_0 = const()[name = string("matmul_2_transpose_y_0"), val = bool(true)]; bool matmul_2_transpose_x_0 = const()[name = string("matmul_2_transpose_x_0"), val = bool(false)]; tensor transpose_132_perm_0 = const()[name = string("transpose_132_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_133_perm_0 = const()[name = string("transpose_133_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_133 = transpose(perm = transpose_133_perm_0, x = var_241_cast_fp16)[name = string("transpose_310")]; tensor transpose_132 = transpose(perm = transpose_132_perm_0, x = mul_5_cast_fp16)[name = string("transpose_311")]; tensor matmul_2_cast_fp16 = matmul(transpose_x = matmul_2_transpose_x_0, transpose_y = matmul_2_transpose_y_0, x = transpose_132, y = transpose_133)[name = string("matmul_2_cast_fp16")]; tensor add_2_cast_fp16 = add(x = matmul_2_cast_fp16, y = mul_0_to_fp16)[name = string("add_2_cast_fp16")]; int32 softmax_2_axis_0 = const()[name = string("softmax_2_axis_0"), val = int32(-1)]; tensor softmax_2_cast_fp16 = softmax(axis = softmax_2_axis_0, x = add_2_cast_fp16)[name = string("softmax_2_cast_fp16")]; bool attn_output_9_transpose_x_0 = const()[name = string("attn_output_9_transpose_x_0"), val = bool(false)]; bool attn_output_9_transpose_y_0 = const()[name = string("attn_output_9_transpose_y_0"), val = bool(false)]; tensor value_5_cast_fp16 = transpose(perm = value_5_perm_0, x = var_244_cast_fp16)[name = string("transpose_309")]; tensor attn_output_9_cast_fp16 = matmul(transpose_x = attn_output_9_transpose_x_0, transpose_y = attn_output_9_transpose_y_0, x = softmax_2_cast_fp16, y = value_5_cast_fp16)[name = string("attn_output_9_cast_fp16")]; tensor var_247_perm_0 = const()[name = string("op_247_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_249 = const()[name = string("op_249"), val = tensor([1, 77, -1])]; tensor var_247_cast_fp16 = transpose(perm = var_247_perm_0, x = attn_output_9_cast_fp16)[name = string("transpose_308")]; tensor var_250_cast_fp16 = reshape(shape = var_249, x = var_247_cast_fp16)[name = string("op_250_cast_fp16")]; tensor encoder_text_model_encoder_layers_2_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(81511808))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(82740672))))[name = string("encoder_text_model_encoder_layers_2_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_2_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_2_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(82750976)))]; tensor linear_15_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_2_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_2_self_attn_out_proj_weight_to_fp16_palettized, x = var_250_cast_fp16)[name = string("linear_15_cast_fp16")]; tensor input_31_cast_fp16 = add(x = input_27_cast_fp16, y = linear_15_cast_fp16)[name = string("input_31_cast_fp16")]; tensor input_33_axes_0 = const()[name = string("input_33_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_2_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_2_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(82753600)))]; tensor encoder_text_model_encoder_layers_2_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_2_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(82756224)))]; tensor input_33_cast_fp16 = layer_norm(axes = input_33_axes_0, beta = encoder_text_model_encoder_layers_2_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_2_layer_norm2_weight_to_fp16, x = input_31_cast_fp16)[name = string("input_33_cast_fp16")]; tensor encoder_text_model_encoder_layers_2_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(82758848))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(87674112))))[name = string("encoder_text_model_encoder_layers_2_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_2_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_2_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(87715136)))]; tensor linear_16_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_2_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_2_mlp_fc1_weight_to_fp16_palettized, x = input_33_cast_fp16)[name = string("linear_16_cast_fp16")]; string input_37_mode_0 = const()[name = string("input_37_mode_0"), val = string("EXACT")]; tensor input_37_cast_fp16 = gelu(mode = input_37_mode_0, x = linear_16_cast_fp16)[name = string("input_37_cast_fp16")]; tensor encoder_text_model_encoder_layers_2_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(87725440))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(92640704))))[name = string("encoder_text_model_encoder_layers_2_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_2_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_2_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(92651008)))]; tensor linear_17_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_2_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_2_mlp_fc2_weight_to_fp16_palettized, x = input_37_cast_fp16)[name = string("linear_17_cast_fp16")]; tensor input_39_cast_fp16 = add(x = input_31_cast_fp16, y = linear_17_cast_fp16)[name = string("input_39_cast_fp16")]; tensor hidden_states_19_axes_0 = const()[name = string("hidden_states_19_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_3_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_3_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(92653632)))]; tensor encoder_text_model_encoder_layers_3_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_3_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(92656256)))]; tensor hidden_states_19_cast_fp16 = layer_norm(axes = hidden_states_19_axes_0, beta = encoder_text_model_encoder_layers_3_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_3_layer_norm1_weight_to_fp16, x = input_39_cast_fp16)[name = string("hidden_states_19_cast_fp16")]; tensor encoder_text_model_encoder_layers_3_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(92658880))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(93887744))))[name = string("encoder_text_model_encoder_layers_3_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_3_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_3_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(93898048)))]; tensor linear_18_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_3_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_3_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_19_cast_fp16)[name = string("linear_18_cast_fp16")]; tensor encoder_text_model_encoder_layers_3_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(93900672))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(95129536))))[name = string("encoder_text_model_encoder_layers_3_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_3_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_3_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(95139840)))]; tensor linear_19_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_3_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_3_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_19_cast_fp16)[name = string("linear_19_cast_fp16")]; tensor encoder_text_model_encoder_layers_3_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(95142464))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(96371328))))[name = string("encoder_text_model_encoder_layers_3_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_3_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_3_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(96381632)))]; tensor linear_20_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_3_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_3_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_19_cast_fp16)[name = string("linear_20_cast_fp16")]; tensor var_293 = const()[name = string("op_293"), val = tensor([1, 77, -1, 64])]; tensor var_294_cast_fp16 = reshape(shape = var_293, x = linear_18_cast_fp16)[name = string("op_294_cast_fp16")]; tensor var_296 = const()[name = string("op_296"), val = tensor([1, 77, -1, 64])]; tensor var_297_cast_fp16 = reshape(shape = var_296, x = linear_19_cast_fp16)[name = string("op_297_cast_fp16")]; tensor var_299 = const()[name = string("op_299"), val = tensor([1, 77, -1, 64])]; tensor var_300_cast_fp16 = reshape(shape = var_299, x = linear_20_cast_fp16)[name = string("op_300_cast_fp16")]; tensor value_7_perm_0 = const()[name = string("value_7_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_7_cast_fp16 = mul(x = var_294_cast_fp16, y = var_11_to_fp16)[name = string("mul_7_cast_fp16")]; bool matmul_3_transpose_y_0 = const()[name = string("matmul_3_transpose_y_0"), val = bool(true)]; bool matmul_3_transpose_x_0 = const()[name = string("matmul_3_transpose_x_0"), val = bool(false)]; tensor transpose_134_perm_0 = const()[name = string("transpose_134_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_135_perm_0 = const()[name = string("transpose_135_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_135 = transpose(perm = transpose_135_perm_0, x = var_297_cast_fp16)[name = string("transpose_306")]; tensor transpose_134 = transpose(perm = transpose_134_perm_0, x = mul_7_cast_fp16)[name = string("transpose_307")]; tensor matmul_3_cast_fp16 = matmul(transpose_x = matmul_3_transpose_x_0, transpose_y = matmul_3_transpose_y_0, x = transpose_134, y = transpose_135)[name = string("matmul_3_cast_fp16")]; tensor add_3_cast_fp16 = add(x = matmul_3_cast_fp16, y = mul_0_to_fp16)[name = string("add_3_cast_fp16")]; int32 softmax_3_axis_0 = const()[name = string("softmax_3_axis_0"), val = int32(-1)]; tensor softmax_3_cast_fp16 = softmax(axis = softmax_3_axis_0, x = add_3_cast_fp16)[name = string("softmax_3_cast_fp16")]; bool attn_output_13_transpose_x_0 = const()[name = string("attn_output_13_transpose_x_0"), val = bool(false)]; bool attn_output_13_transpose_y_0 = const()[name = string("attn_output_13_transpose_y_0"), val = bool(false)]; tensor value_7_cast_fp16 = transpose(perm = value_7_perm_0, x = var_300_cast_fp16)[name = string("transpose_305")]; tensor attn_output_13_cast_fp16 = matmul(transpose_x = attn_output_13_transpose_x_0, transpose_y = attn_output_13_transpose_y_0, x = softmax_3_cast_fp16, y = value_7_cast_fp16)[name = string("attn_output_13_cast_fp16")]; tensor var_303_perm_0 = const()[name = string("op_303_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_305 = const()[name = string("op_305"), val = tensor([1, 77, -1])]; tensor var_303_cast_fp16 = transpose(perm = var_303_perm_0, x = attn_output_13_cast_fp16)[name = string("transpose_304")]; tensor var_306_cast_fp16 = reshape(shape = var_305, x = var_303_cast_fp16)[name = string("op_306_cast_fp16")]; tensor encoder_text_model_encoder_layers_3_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(96384256))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(97613120))))[name = string("encoder_text_model_encoder_layers_3_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_3_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_3_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(97623424)))]; tensor linear_21_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_3_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_3_self_attn_out_proj_weight_to_fp16_palettized, x = var_306_cast_fp16)[name = string("linear_21_cast_fp16")]; tensor input_43_cast_fp16 = add(x = input_39_cast_fp16, y = linear_21_cast_fp16)[name = string("input_43_cast_fp16")]; tensor input_45_axes_0 = const()[name = string("input_45_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_3_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_3_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(97626048)))]; tensor encoder_text_model_encoder_layers_3_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_3_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(97628672)))]; tensor input_45_cast_fp16 = layer_norm(axes = input_45_axes_0, beta = encoder_text_model_encoder_layers_3_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_3_layer_norm2_weight_to_fp16, x = input_43_cast_fp16)[name = string("input_45_cast_fp16")]; tensor encoder_text_model_encoder_layers_3_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(97631296))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(102546560))))[name = string("encoder_text_model_encoder_layers_3_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_3_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_3_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(102587584)))]; tensor linear_22_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_3_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_3_mlp_fc1_weight_to_fp16_palettized, x = input_45_cast_fp16)[name = string("linear_22_cast_fp16")]; string input_49_mode_0 = const()[name = string("input_49_mode_0"), val = string("EXACT")]; tensor input_49_cast_fp16 = gelu(mode = input_49_mode_0, x = linear_22_cast_fp16)[name = string("input_49_cast_fp16")]; tensor encoder_text_model_encoder_layers_3_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(102597888))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(107513152))))[name = string("encoder_text_model_encoder_layers_3_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_3_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_3_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(107523456)))]; tensor linear_23_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_3_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_3_mlp_fc2_weight_to_fp16_palettized, x = input_49_cast_fp16)[name = string("linear_23_cast_fp16")]; tensor input_51_cast_fp16 = add(x = input_43_cast_fp16, y = linear_23_cast_fp16)[name = string("input_51_cast_fp16")]; tensor hidden_states_25_axes_0 = const()[name = string("hidden_states_25_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_4_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_4_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(107526080)))]; tensor encoder_text_model_encoder_layers_4_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_4_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(107528704)))]; tensor hidden_states_25_cast_fp16 = layer_norm(axes = hidden_states_25_axes_0, beta = encoder_text_model_encoder_layers_4_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_4_layer_norm1_weight_to_fp16, x = input_51_cast_fp16)[name = string("hidden_states_25_cast_fp16")]; tensor encoder_text_model_encoder_layers_4_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(107531328))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(108760192))))[name = string("encoder_text_model_encoder_layers_4_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_4_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_4_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(108770496)))]; tensor linear_24_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_4_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_4_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_25_cast_fp16)[name = string("linear_24_cast_fp16")]; tensor encoder_text_model_encoder_layers_4_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(108773120))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(110001984))))[name = string("encoder_text_model_encoder_layers_4_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_4_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_4_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(110012288)))]; tensor linear_25_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_4_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_4_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_25_cast_fp16)[name = string("linear_25_cast_fp16")]; tensor encoder_text_model_encoder_layers_4_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(110014912))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(111243776))))[name = string("encoder_text_model_encoder_layers_4_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_4_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_4_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(111254080)))]; tensor linear_26_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_4_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_4_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_25_cast_fp16)[name = string("linear_26_cast_fp16")]; tensor var_349 = const()[name = string("op_349"), val = tensor([1, 77, -1, 64])]; tensor var_350_cast_fp16 = reshape(shape = var_349, x = linear_24_cast_fp16)[name = string("op_350_cast_fp16")]; tensor var_352 = const()[name = string("op_352"), val = tensor([1, 77, -1, 64])]; tensor var_353_cast_fp16 = reshape(shape = var_352, x = linear_25_cast_fp16)[name = string("op_353_cast_fp16")]; tensor var_355 = const()[name = string("op_355"), val = tensor([1, 77, -1, 64])]; tensor var_356_cast_fp16 = reshape(shape = var_355, x = linear_26_cast_fp16)[name = string("op_356_cast_fp16")]; tensor value_9_perm_0 = const()[name = string("value_9_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_9_cast_fp16 = mul(x = var_350_cast_fp16, y = var_11_to_fp16)[name = string("mul_9_cast_fp16")]; bool matmul_4_transpose_y_0 = const()[name = string("matmul_4_transpose_y_0"), val = bool(true)]; bool matmul_4_transpose_x_0 = const()[name = string("matmul_4_transpose_x_0"), val = bool(false)]; tensor transpose_136_perm_0 = const()[name = string("transpose_136_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_137_perm_0 = const()[name = string("transpose_137_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_137 = transpose(perm = transpose_137_perm_0, x = var_353_cast_fp16)[name = string("transpose_302")]; tensor transpose_136 = transpose(perm = transpose_136_perm_0, x = mul_9_cast_fp16)[name = string("transpose_303")]; tensor matmul_4_cast_fp16 = matmul(transpose_x = matmul_4_transpose_x_0, transpose_y = matmul_4_transpose_y_0, x = transpose_136, y = transpose_137)[name = string("matmul_4_cast_fp16")]; tensor add_4_cast_fp16 = add(x = matmul_4_cast_fp16, y = mul_0_to_fp16)[name = string("add_4_cast_fp16")]; int32 softmax_4_axis_0 = const()[name = string("softmax_4_axis_0"), val = int32(-1)]; tensor softmax_4_cast_fp16 = softmax(axis = softmax_4_axis_0, x = add_4_cast_fp16)[name = string("softmax_4_cast_fp16")]; bool attn_output_17_transpose_x_0 = const()[name = string("attn_output_17_transpose_x_0"), val = bool(false)]; bool attn_output_17_transpose_y_0 = const()[name = string("attn_output_17_transpose_y_0"), val = bool(false)]; tensor value_9_cast_fp16 = transpose(perm = value_9_perm_0, x = var_356_cast_fp16)[name = string("transpose_301")]; tensor attn_output_17_cast_fp16 = matmul(transpose_x = attn_output_17_transpose_x_0, transpose_y = attn_output_17_transpose_y_0, x = softmax_4_cast_fp16, y = value_9_cast_fp16)[name = string("attn_output_17_cast_fp16")]; tensor var_359_perm_0 = const()[name = string("op_359_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_361 = const()[name = string("op_361"), val = tensor([1, 77, -1])]; tensor var_359_cast_fp16 = transpose(perm = var_359_perm_0, x = attn_output_17_cast_fp16)[name = string("transpose_300")]; tensor var_362_cast_fp16 = reshape(shape = var_361, x = var_359_cast_fp16)[name = string("op_362_cast_fp16")]; tensor encoder_text_model_encoder_layers_4_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(111256704))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(112485568))))[name = string("encoder_text_model_encoder_layers_4_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_4_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_4_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(112495872)))]; tensor linear_27_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_4_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_4_self_attn_out_proj_weight_to_fp16_palettized, x = var_362_cast_fp16)[name = string("linear_27_cast_fp16")]; tensor input_55_cast_fp16 = add(x = input_51_cast_fp16, y = linear_27_cast_fp16)[name = string("input_55_cast_fp16")]; tensor input_57_axes_0 = const()[name = string("input_57_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_4_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_4_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(112498496)))]; tensor encoder_text_model_encoder_layers_4_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_4_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(112501120)))]; tensor input_57_cast_fp16 = layer_norm(axes = input_57_axes_0, beta = encoder_text_model_encoder_layers_4_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_4_layer_norm2_weight_to_fp16, x = input_55_cast_fp16)[name = string("input_57_cast_fp16")]; tensor encoder_text_model_encoder_layers_4_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(112503744))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(117419008))))[name = string("encoder_text_model_encoder_layers_4_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_4_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_4_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(117460032)))]; tensor linear_28_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_4_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_4_mlp_fc1_weight_to_fp16_palettized, x = input_57_cast_fp16)[name = string("linear_28_cast_fp16")]; string input_61_mode_0 = const()[name = string("input_61_mode_0"), val = string("EXACT")]; tensor input_61_cast_fp16 = gelu(mode = input_61_mode_0, x = linear_28_cast_fp16)[name = string("input_61_cast_fp16")]; tensor encoder_text_model_encoder_layers_4_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(117470336))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(122385600))))[name = string("encoder_text_model_encoder_layers_4_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_4_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_4_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(122395904)))]; tensor linear_29_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_4_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_4_mlp_fc2_weight_to_fp16_palettized, x = input_61_cast_fp16)[name = string("linear_29_cast_fp16")]; tensor input_63_cast_fp16 = add(x = input_55_cast_fp16, y = linear_29_cast_fp16)[name = string("input_63_cast_fp16")]; tensor hidden_states_31_axes_0 = const()[name = string("hidden_states_31_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_5_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_5_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(122398528)))]; tensor encoder_text_model_encoder_layers_5_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_5_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(122401152)))]; tensor hidden_states_31_cast_fp16 = layer_norm(axes = hidden_states_31_axes_0, beta = encoder_text_model_encoder_layers_5_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_5_layer_norm1_weight_to_fp16, x = input_63_cast_fp16)[name = string("hidden_states_31_cast_fp16")]; tensor encoder_text_model_encoder_layers_5_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(122403776))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(123632640))))[name = string("encoder_text_model_encoder_layers_5_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_5_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_5_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(123642944)))]; tensor linear_30_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_5_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_5_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_31_cast_fp16)[name = string("linear_30_cast_fp16")]; tensor encoder_text_model_encoder_layers_5_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(123645568))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(124874432))))[name = string("encoder_text_model_encoder_layers_5_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_5_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_5_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(124884736)))]; tensor linear_31_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_5_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_5_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_31_cast_fp16)[name = string("linear_31_cast_fp16")]; tensor encoder_text_model_encoder_layers_5_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(124887360))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(126116224))))[name = string("encoder_text_model_encoder_layers_5_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_5_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_5_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(126126528)))]; tensor linear_32_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_5_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_5_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_31_cast_fp16)[name = string("linear_32_cast_fp16")]; tensor var_405 = const()[name = string("op_405"), val = tensor([1, 77, -1, 64])]; tensor var_406_cast_fp16 = reshape(shape = var_405, x = linear_30_cast_fp16)[name = string("op_406_cast_fp16")]; tensor var_408 = const()[name = string("op_408"), val = tensor([1, 77, -1, 64])]; tensor var_409_cast_fp16 = reshape(shape = var_408, x = linear_31_cast_fp16)[name = string("op_409_cast_fp16")]; tensor var_411 = const()[name = string("op_411"), val = tensor([1, 77, -1, 64])]; tensor var_412_cast_fp16 = reshape(shape = var_411, x = linear_32_cast_fp16)[name = string("op_412_cast_fp16")]; tensor value_11_perm_0 = const()[name = string("value_11_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_11_cast_fp16 = mul(x = var_406_cast_fp16, y = var_11_to_fp16)[name = string("mul_11_cast_fp16")]; bool matmul_5_transpose_y_0 = const()[name = string("matmul_5_transpose_y_0"), val = bool(true)]; bool matmul_5_transpose_x_0 = const()[name = string("matmul_5_transpose_x_0"), val = bool(false)]; tensor transpose_138_perm_0 = const()[name = string("transpose_138_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_139_perm_0 = const()[name = string("transpose_139_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_139 = transpose(perm = transpose_139_perm_0, x = var_409_cast_fp16)[name = string("transpose_298")]; tensor transpose_138 = transpose(perm = transpose_138_perm_0, x = mul_11_cast_fp16)[name = string("transpose_299")]; tensor matmul_5_cast_fp16 = matmul(transpose_x = matmul_5_transpose_x_0, transpose_y = matmul_5_transpose_y_0, x = transpose_138, y = transpose_139)[name = string("matmul_5_cast_fp16")]; tensor add_5_cast_fp16 = add(x = matmul_5_cast_fp16, y = mul_0_to_fp16)[name = string("add_5_cast_fp16")]; int32 softmax_5_axis_0 = const()[name = string("softmax_5_axis_0"), val = int32(-1)]; tensor softmax_5_cast_fp16 = softmax(axis = softmax_5_axis_0, x = add_5_cast_fp16)[name = string("softmax_5_cast_fp16")]; bool attn_output_21_transpose_x_0 = const()[name = string("attn_output_21_transpose_x_0"), val = bool(false)]; bool attn_output_21_transpose_y_0 = const()[name = string("attn_output_21_transpose_y_0"), val = bool(false)]; tensor value_11_cast_fp16 = transpose(perm = value_11_perm_0, x = var_412_cast_fp16)[name = string("transpose_297")]; tensor attn_output_21_cast_fp16 = matmul(transpose_x = attn_output_21_transpose_x_0, transpose_y = attn_output_21_transpose_y_0, x = softmax_5_cast_fp16, y = value_11_cast_fp16)[name = string("attn_output_21_cast_fp16")]; tensor var_415_perm_0 = const()[name = string("op_415_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_417 = const()[name = string("op_417"), val = tensor([1, 77, -1])]; tensor var_415_cast_fp16 = transpose(perm = var_415_perm_0, x = attn_output_21_cast_fp16)[name = string("transpose_296")]; tensor var_418_cast_fp16 = reshape(shape = var_417, x = var_415_cast_fp16)[name = string("op_418_cast_fp16")]; tensor encoder_text_model_encoder_layers_5_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(126129152))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(127358016))))[name = string("encoder_text_model_encoder_layers_5_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_5_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_5_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(127368320)))]; tensor linear_33_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_5_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_5_self_attn_out_proj_weight_to_fp16_palettized, x = var_418_cast_fp16)[name = string("linear_33_cast_fp16")]; tensor input_67_cast_fp16 = add(x = input_63_cast_fp16, y = linear_33_cast_fp16)[name = string("input_67_cast_fp16")]; tensor input_69_axes_0 = const()[name = string("input_69_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_5_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_5_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(127370944)))]; tensor encoder_text_model_encoder_layers_5_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_5_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(127373568)))]; tensor input_69_cast_fp16 = layer_norm(axes = input_69_axes_0, beta = encoder_text_model_encoder_layers_5_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_5_layer_norm2_weight_to_fp16, x = input_67_cast_fp16)[name = string("input_69_cast_fp16")]; tensor encoder_text_model_encoder_layers_5_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(127376192))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(132291456))))[name = string("encoder_text_model_encoder_layers_5_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_5_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_5_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(132332480)))]; tensor linear_34_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_5_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_5_mlp_fc1_weight_to_fp16_palettized, x = input_69_cast_fp16)[name = string("linear_34_cast_fp16")]; string input_73_mode_0 = const()[name = string("input_73_mode_0"), val = string("EXACT")]; tensor input_73_cast_fp16 = gelu(mode = input_73_mode_0, x = linear_34_cast_fp16)[name = string("input_73_cast_fp16")]; tensor encoder_text_model_encoder_layers_5_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(132342784))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(137258048))))[name = string("encoder_text_model_encoder_layers_5_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_5_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_5_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(137268352)))]; tensor linear_35_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_5_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_5_mlp_fc2_weight_to_fp16_palettized, x = input_73_cast_fp16)[name = string("linear_35_cast_fp16")]; tensor input_75_cast_fp16 = add(x = input_67_cast_fp16, y = linear_35_cast_fp16)[name = string("input_75_cast_fp16")]; tensor hidden_states_37_axes_0 = const()[name = string("hidden_states_37_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_6_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_6_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(137270976)))]; tensor encoder_text_model_encoder_layers_6_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_6_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(137273600)))]; tensor hidden_states_37_cast_fp16 = layer_norm(axes = hidden_states_37_axes_0, beta = encoder_text_model_encoder_layers_6_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_6_layer_norm1_weight_to_fp16, x = input_75_cast_fp16)[name = string("hidden_states_37_cast_fp16")]; tensor encoder_text_model_encoder_layers_6_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(137276224))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(138505088))))[name = string("encoder_text_model_encoder_layers_6_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_6_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_6_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(138515392)))]; tensor linear_36_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_6_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_6_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_37_cast_fp16)[name = string("linear_36_cast_fp16")]; tensor encoder_text_model_encoder_layers_6_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(138518016))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(139746880))))[name = string("encoder_text_model_encoder_layers_6_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_6_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_6_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(139757184)))]; tensor linear_37_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_6_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_6_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_37_cast_fp16)[name = string("linear_37_cast_fp16")]; tensor encoder_text_model_encoder_layers_6_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(139759808))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(140988672))))[name = string("encoder_text_model_encoder_layers_6_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_6_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_6_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(140998976)))]; tensor linear_38_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_6_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_6_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_37_cast_fp16)[name = string("linear_38_cast_fp16")]; tensor var_461 = const()[name = string("op_461"), val = tensor([1, 77, -1, 64])]; tensor var_462_cast_fp16 = reshape(shape = var_461, x = linear_36_cast_fp16)[name = string("op_462_cast_fp16")]; tensor var_464 = const()[name = string("op_464"), val = tensor([1, 77, -1, 64])]; tensor var_465_cast_fp16 = reshape(shape = var_464, x = linear_37_cast_fp16)[name = string("op_465_cast_fp16")]; tensor var_467 = const()[name = string("op_467"), val = tensor([1, 77, -1, 64])]; tensor var_468_cast_fp16 = reshape(shape = var_467, x = linear_38_cast_fp16)[name = string("op_468_cast_fp16")]; tensor value_13_perm_0 = const()[name = string("value_13_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_13_cast_fp16 = mul(x = var_462_cast_fp16, y = var_11_to_fp16)[name = string("mul_13_cast_fp16")]; bool matmul_6_transpose_y_0 = const()[name = string("matmul_6_transpose_y_0"), val = bool(true)]; bool matmul_6_transpose_x_0 = const()[name = string("matmul_6_transpose_x_0"), val = bool(false)]; tensor transpose_140_perm_0 = const()[name = string("transpose_140_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_141_perm_0 = const()[name = string("transpose_141_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_141 = transpose(perm = transpose_141_perm_0, x = var_465_cast_fp16)[name = string("transpose_294")]; tensor transpose_140 = transpose(perm = transpose_140_perm_0, x = mul_13_cast_fp16)[name = string("transpose_295")]; tensor matmul_6_cast_fp16 = matmul(transpose_x = matmul_6_transpose_x_0, transpose_y = matmul_6_transpose_y_0, x = transpose_140, y = transpose_141)[name = string("matmul_6_cast_fp16")]; tensor add_6_cast_fp16 = add(x = matmul_6_cast_fp16, y = mul_0_to_fp16)[name = string("add_6_cast_fp16")]; int32 softmax_6_axis_0 = const()[name = string("softmax_6_axis_0"), val = int32(-1)]; tensor softmax_6_cast_fp16 = softmax(axis = softmax_6_axis_0, x = add_6_cast_fp16)[name = string("softmax_6_cast_fp16")]; bool attn_output_25_transpose_x_0 = const()[name = string("attn_output_25_transpose_x_0"), val = bool(false)]; bool attn_output_25_transpose_y_0 = const()[name = string("attn_output_25_transpose_y_0"), val = bool(false)]; tensor value_13_cast_fp16 = transpose(perm = value_13_perm_0, x = var_468_cast_fp16)[name = string("transpose_293")]; tensor attn_output_25_cast_fp16 = matmul(transpose_x = attn_output_25_transpose_x_0, transpose_y = attn_output_25_transpose_y_0, x = softmax_6_cast_fp16, y = value_13_cast_fp16)[name = string("attn_output_25_cast_fp16")]; tensor var_471_perm_0 = const()[name = string("op_471_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_473 = const()[name = string("op_473"), val = tensor([1, 77, -1])]; tensor var_471_cast_fp16 = transpose(perm = var_471_perm_0, x = attn_output_25_cast_fp16)[name = string("transpose_292")]; tensor var_474_cast_fp16 = reshape(shape = var_473, x = var_471_cast_fp16)[name = string("op_474_cast_fp16")]; tensor encoder_text_model_encoder_layers_6_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(141001600))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(142230464))))[name = string("encoder_text_model_encoder_layers_6_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_6_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_6_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(142240768)))]; tensor linear_39_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_6_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_6_self_attn_out_proj_weight_to_fp16_palettized, x = var_474_cast_fp16)[name = string("linear_39_cast_fp16")]; tensor input_79_cast_fp16 = add(x = input_75_cast_fp16, y = linear_39_cast_fp16)[name = string("input_79_cast_fp16")]; tensor input_81_axes_0 = const()[name = string("input_81_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_6_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_6_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(142243392)))]; tensor encoder_text_model_encoder_layers_6_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_6_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(142246016)))]; tensor input_81_cast_fp16 = layer_norm(axes = input_81_axes_0, beta = encoder_text_model_encoder_layers_6_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_6_layer_norm2_weight_to_fp16, x = input_79_cast_fp16)[name = string("input_81_cast_fp16")]; tensor encoder_text_model_encoder_layers_6_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(142248640))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(147163904))))[name = string("encoder_text_model_encoder_layers_6_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_6_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_6_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(147204928)))]; tensor linear_40_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_6_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_6_mlp_fc1_weight_to_fp16_palettized, x = input_81_cast_fp16)[name = string("linear_40_cast_fp16")]; string input_85_mode_0 = const()[name = string("input_85_mode_0"), val = string("EXACT")]; tensor input_85_cast_fp16 = gelu(mode = input_85_mode_0, x = linear_40_cast_fp16)[name = string("input_85_cast_fp16")]; tensor encoder_text_model_encoder_layers_6_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(147215232))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(152130496))))[name = string("encoder_text_model_encoder_layers_6_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_6_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_6_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(152140800)))]; tensor linear_41_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_6_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_6_mlp_fc2_weight_to_fp16_palettized, x = input_85_cast_fp16)[name = string("linear_41_cast_fp16")]; tensor input_87_cast_fp16 = add(x = input_79_cast_fp16, y = linear_41_cast_fp16)[name = string("input_87_cast_fp16")]; tensor hidden_states_43_axes_0 = const()[name = string("hidden_states_43_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_7_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_7_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(152143424)))]; tensor encoder_text_model_encoder_layers_7_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_7_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(152146048)))]; tensor hidden_states_43_cast_fp16 = layer_norm(axes = hidden_states_43_axes_0, beta = encoder_text_model_encoder_layers_7_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_7_layer_norm1_weight_to_fp16, x = input_87_cast_fp16)[name = string("hidden_states_43_cast_fp16")]; tensor encoder_text_model_encoder_layers_7_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(152148672))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(153377536))))[name = string("encoder_text_model_encoder_layers_7_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_7_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_7_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(153387840)))]; tensor linear_42_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_7_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_7_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_43_cast_fp16)[name = string("linear_42_cast_fp16")]; tensor encoder_text_model_encoder_layers_7_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(153390464))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(154619328))))[name = string("encoder_text_model_encoder_layers_7_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_7_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_7_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(154629632)))]; tensor linear_43_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_7_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_7_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_43_cast_fp16)[name = string("linear_43_cast_fp16")]; tensor encoder_text_model_encoder_layers_7_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(154632256))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(155861120))))[name = string("encoder_text_model_encoder_layers_7_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_7_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_7_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(155871424)))]; tensor linear_44_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_7_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_7_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_43_cast_fp16)[name = string("linear_44_cast_fp16")]; tensor var_517 = const()[name = string("op_517"), val = tensor([1, 77, -1, 64])]; tensor var_518_cast_fp16 = reshape(shape = var_517, x = linear_42_cast_fp16)[name = string("op_518_cast_fp16")]; tensor var_520 = const()[name = string("op_520"), val = tensor([1, 77, -1, 64])]; tensor var_521_cast_fp16 = reshape(shape = var_520, x = linear_43_cast_fp16)[name = string("op_521_cast_fp16")]; tensor var_523 = const()[name = string("op_523"), val = tensor([1, 77, -1, 64])]; tensor var_524_cast_fp16 = reshape(shape = var_523, x = linear_44_cast_fp16)[name = string("op_524_cast_fp16")]; tensor value_15_perm_0 = const()[name = string("value_15_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_15_cast_fp16 = mul(x = var_518_cast_fp16, y = var_11_to_fp16)[name = string("mul_15_cast_fp16")]; bool matmul_7_transpose_y_0 = const()[name = string("matmul_7_transpose_y_0"), val = bool(true)]; bool matmul_7_transpose_x_0 = const()[name = string("matmul_7_transpose_x_0"), val = bool(false)]; tensor transpose_142_perm_0 = const()[name = string("transpose_142_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_143_perm_0 = const()[name = string("transpose_143_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_143 = transpose(perm = transpose_143_perm_0, x = var_521_cast_fp16)[name = string("transpose_290")]; tensor transpose_142 = transpose(perm = transpose_142_perm_0, x = mul_15_cast_fp16)[name = string("transpose_291")]; tensor matmul_7_cast_fp16 = matmul(transpose_x = matmul_7_transpose_x_0, transpose_y = matmul_7_transpose_y_0, x = transpose_142, y = transpose_143)[name = string("matmul_7_cast_fp16")]; tensor add_7_cast_fp16 = add(x = matmul_7_cast_fp16, y = mul_0_to_fp16)[name = string("add_7_cast_fp16")]; int32 softmax_7_axis_0 = const()[name = string("softmax_7_axis_0"), val = int32(-1)]; tensor softmax_7_cast_fp16 = softmax(axis = softmax_7_axis_0, x = add_7_cast_fp16)[name = string("softmax_7_cast_fp16")]; bool attn_output_29_transpose_x_0 = const()[name = string("attn_output_29_transpose_x_0"), val = bool(false)]; bool attn_output_29_transpose_y_0 = const()[name = string("attn_output_29_transpose_y_0"), val = bool(false)]; tensor value_15_cast_fp16 = transpose(perm = value_15_perm_0, x = var_524_cast_fp16)[name = string("transpose_289")]; tensor attn_output_29_cast_fp16 = matmul(transpose_x = attn_output_29_transpose_x_0, transpose_y = attn_output_29_transpose_y_0, x = softmax_7_cast_fp16, y = value_15_cast_fp16)[name = string("attn_output_29_cast_fp16")]; tensor var_527_perm_0 = const()[name = string("op_527_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_529 = const()[name = string("op_529"), val = tensor([1, 77, -1])]; tensor var_527_cast_fp16 = transpose(perm = var_527_perm_0, x = attn_output_29_cast_fp16)[name = string("transpose_288")]; tensor var_530_cast_fp16 = reshape(shape = var_529, x = var_527_cast_fp16)[name = string("op_530_cast_fp16")]; tensor encoder_text_model_encoder_layers_7_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(155874048))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(157102912))))[name = string("encoder_text_model_encoder_layers_7_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_7_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_7_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(157113216)))]; tensor linear_45_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_7_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_7_self_attn_out_proj_weight_to_fp16_palettized, x = var_530_cast_fp16)[name = string("linear_45_cast_fp16")]; tensor input_91_cast_fp16 = add(x = input_87_cast_fp16, y = linear_45_cast_fp16)[name = string("input_91_cast_fp16")]; tensor input_93_axes_0 = const()[name = string("input_93_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_7_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_7_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(157115840)))]; tensor encoder_text_model_encoder_layers_7_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_7_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(157118464)))]; tensor input_93_cast_fp16 = layer_norm(axes = input_93_axes_0, beta = encoder_text_model_encoder_layers_7_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_7_layer_norm2_weight_to_fp16, x = input_91_cast_fp16)[name = string("input_93_cast_fp16")]; tensor encoder_text_model_encoder_layers_7_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(157121088))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(162036352))))[name = string("encoder_text_model_encoder_layers_7_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_7_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_7_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(162077376)))]; tensor linear_46_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_7_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_7_mlp_fc1_weight_to_fp16_palettized, x = input_93_cast_fp16)[name = string("linear_46_cast_fp16")]; string input_97_mode_0 = const()[name = string("input_97_mode_0"), val = string("EXACT")]; tensor input_97_cast_fp16 = gelu(mode = input_97_mode_0, x = linear_46_cast_fp16)[name = string("input_97_cast_fp16")]; tensor encoder_text_model_encoder_layers_7_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(162087680))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(167002944))))[name = string("encoder_text_model_encoder_layers_7_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_7_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_7_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(167013248)))]; tensor linear_47_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_7_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_7_mlp_fc2_weight_to_fp16_palettized, x = input_97_cast_fp16)[name = string("linear_47_cast_fp16")]; tensor input_99_cast_fp16 = add(x = input_91_cast_fp16, y = linear_47_cast_fp16)[name = string("input_99_cast_fp16")]; tensor hidden_states_49_axes_0 = const()[name = string("hidden_states_49_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_8_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_8_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(167015872)))]; tensor encoder_text_model_encoder_layers_8_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_8_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(167018496)))]; tensor hidden_states_49_cast_fp16 = layer_norm(axes = hidden_states_49_axes_0, beta = encoder_text_model_encoder_layers_8_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_8_layer_norm1_weight_to_fp16, x = input_99_cast_fp16)[name = string("hidden_states_49_cast_fp16")]; tensor encoder_text_model_encoder_layers_8_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(167021120))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(168249984))))[name = string("encoder_text_model_encoder_layers_8_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_8_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_8_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(168260288)))]; tensor linear_48_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_8_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_8_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_49_cast_fp16)[name = string("linear_48_cast_fp16")]; tensor encoder_text_model_encoder_layers_8_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(168262912))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(169491776))))[name = string("encoder_text_model_encoder_layers_8_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_8_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_8_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(169502080)))]; tensor linear_49_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_8_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_8_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_49_cast_fp16)[name = string("linear_49_cast_fp16")]; tensor encoder_text_model_encoder_layers_8_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(169504704))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(170733568))))[name = string("encoder_text_model_encoder_layers_8_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_8_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_8_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(170743872)))]; tensor linear_50_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_8_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_8_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_49_cast_fp16)[name = string("linear_50_cast_fp16")]; tensor var_573 = const()[name = string("op_573"), val = tensor([1, 77, -1, 64])]; tensor var_574_cast_fp16 = reshape(shape = var_573, x = linear_48_cast_fp16)[name = string("op_574_cast_fp16")]; tensor var_576 = const()[name = string("op_576"), val = tensor([1, 77, -1, 64])]; tensor var_577_cast_fp16 = reshape(shape = var_576, x = linear_49_cast_fp16)[name = string("op_577_cast_fp16")]; tensor var_579 = const()[name = string("op_579"), val = tensor([1, 77, -1, 64])]; tensor var_580_cast_fp16 = reshape(shape = var_579, x = linear_50_cast_fp16)[name = string("op_580_cast_fp16")]; tensor value_17_perm_0 = const()[name = string("value_17_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_17_cast_fp16 = mul(x = var_574_cast_fp16, y = var_11_to_fp16)[name = string("mul_17_cast_fp16")]; bool matmul_8_transpose_y_0 = const()[name = string("matmul_8_transpose_y_0"), val = bool(true)]; bool matmul_8_transpose_x_0 = const()[name = string("matmul_8_transpose_x_0"), val = bool(false)]; tensor transpose_144_perm_0 = const()[name = string("transpose_144_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_145_perm_0 = const()[name = string("transpose_145_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_145 = transpose(perm = transpose_145_perm_0, x = var_577_cast_fp16)[name = string("transpose_286")]; tensor transpose_144 = transpose(perm = transpose_144_perm_0, x = mul_17_cast_fp16)[name = string("transpose_287")]; tensor matmul_8_cast_fp16 = matmul(transpose_x = matmul_8_transpose_x_0, transpose_y = matmul_8_transpose_y_0, x = transpose_144, y = transpose_145)[name = string("matmul_8_cast_fp16")]; tensor add_8_cast_fp16 = add(x = matmul_8_cast_fp16, y = mul_0_to_fp16)[name = string("add_8_cast_fp16")]; int32 softmax_8_axis_0 = const()[name = string("softmax_8_axis_0"), val = int32(-1)]; tensor softmax_8_cast_fp16 = softmax(axis = softmax_8_axis_0, x = add_8_cast_fp16)[name = string("softmax_8_cast_fp16")]; bool attn_output_33_transpose_x_0 = const()[name = string("attn_output_33_transpose_x_0"), val = bool(false)]; bool attn_output_33_transpose_y_0 = const()[name = string("attn_output_33_transpose_y_0"), val = bool(false)]; tensor value_17_cast_fp16 = transpose(perm = value_17_perm_0, x = var_580_cast_fp16)[name = string("transpose_285")]; tensor attn_output_33_cast_fp16 = matmul(transpose_x = attn_output_33_transpose_x_0, transpose_y = attn_output_33_transpose_y_0, x = softmax_8_cast_fp16, y = value_17_cast_fp16)[name = string("attn_output_33_cast_fp16")]; tensor var_583_perm_0 = const()[name = string("op_583_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_585 = const()[name = string("op_585"), val = tensor([1, 77, -1])]; tensor var_583_cast_fp16 = transpose(perm = var_583_perm_0, x = attn_output_33_cast_fp16)[name = string("transpose_284")]; tensor var_586_cast_fp16 = reshape(shape = var_585, x = var_583_cast_fp16)[name = string("op_586_cast_fp16")]; tensor encoder_text_model_encoder_layers_8_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(170746496))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(171975360))))[name = string("encoder_text_model_encoder_layers_8_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_8_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_8_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(171985664)))]; tensor linear_51_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_8_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_8_self_attn_out_proj_weight_to_fp16_palettized, x = var_586_cast_fp16)[name = string("linear_51_cast_fp16")]; tensor input_103_cast_fp16 = add(x = input_99_cast_fp16, y = linear_51_cast_fp16)[name = string("input_103_cast_fp16")]; tensor input_105_axes_0 = const()[name = string("input_105_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_8_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_8_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(171988288)))]; tensor encoder_text_model_encoder_layers_8_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_8_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(171990912)))]; tensor input_105_cast_fp16 = layer_norm(axes = input_105_axes_0, beta = encoder_text_model_encoder_layers_8_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_8_layer_norm2_weight_to_fp16, x = input_103_cast_fp16)[name = string("input_105_cast_fp16")]; tensor encoder_text_model_encoder_layers_8_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(171993536))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(176908800))))[name = string("encoder_text_model_encoder_layers_8_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_8_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_8_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(176949824)))]; tensor linear_52_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_8_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_8_mlp_fc1_weight_to_fp16_palettized, x = input_105_cast_fp16)[name = string("linear_52_cast_fp16")]; string input_109_mode_0 = const()[name = string("input_109_mode_0"), val = string("EXACT")]; tensor input_109_cast_fp16 = gelu(mode = input_109_mode_0, x = linear_52_cast_fp16)[name = string("input_109_cast_fp16")]; tensor encoder_text_model_encoder_layers_8_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(176960128))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(181875392))))[name = string("encoder_text_model_encoder_layers_8_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_8_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_8_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(181885696)))]; tensor linear_53_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_8_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_8_mlp_fc2_weight_to_fp16_palettized, x = input_109_cast_fp16)[name = string("linear_53_cast_fp16")]; tensor input_111_cast_fp16 = add(x = input_103_cast_fp16, y = linear_53_cast_fp16)[name = string("input_111_cast_fp16")]; tensor hidden_states_55_axes_0 = const()[name = string("hidden_states_55_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_9_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_9_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(181888320)))]; tensor encoder_text_model_encoder_layers_9_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_9_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(181890944)))]; tensor hidden_states_55_cast_fp16 = layer_norm(axes = hidden_states_55_axes_0, beta = encoder_text_model_encoder_layers_9_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_9_layer_norm1_weight_to_fp16, x = input_111_cast_fp16)[name = string("hidden_states_55_cast_fp16")]; tensor encoder_text_model_encoder_layers_9_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(181893568))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(183122432))))[name = string("encoder_text_model_encoder_layers_9_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_9_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_9_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(183132736)))]; tensor linear_54_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_9_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_9_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_55_cast_fp16)[name = string("linear_54_cast_fp16")]; tensor encoder_text_model_encoder_layers_9_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(183135360))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(184364224))))[name = string("encoder_text_model_encoder_layers_9_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_9_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_9_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(184374528)))]; tensor linear_55_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_9_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_9_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_55_cast_fp16)[name = string("linear_55_cast_fp16")]; tensor encoder_text_model_encoder_layers_9_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(184377152))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(185606016))))[name = string("encoder_text_model_encoder_layers_9_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_9_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_9_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(185616320)))]; tensor linear_56_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_9_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_9_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_55_cast_fp16)[name = string("linear_56_cast_fp16")]; tensor var_629 = const()[name = string("op_629"), val = tensor([1, 77, -1, 64])]; tensor var_630_cast_fp16 = reshape(shape = var_629, x = linear_54_cast_fp16)[name = string("op_630_cast_fp16")]; tensor var_632 = const()[name = string("op_632"), val = tensor([1, 77, -1, 64])]; tensor var_633_cast_fp16 = reshape(shape = var_632, x = linear_55_cast_fp16)[name = string("op_633_cast_fp16")]; tensor var_635 = const()[name = string("op_635"), val = tensor([1, 77, -1, 64])]; tensor var_636_cast_fp16 = reshape(shape = var_635, x = linear_56_cast_fp16)[name = string("op_636_cast_fp16")]; tensor value_19_perm_0 = const()[name = string("value_19_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_19_cast_fp16 = mul(x = var_630_cast_fp16, y = var_11_to_fp16)[name = string("mul_19_cast_fp16")]; bool matmul_9_transpose_y_0 = const()[name = string("matmul_9_transpose_y_0"), val = bool(true)]; bool matmul_9_transpose_x_0 = const()[name = string("matmul_9_transpose_x_0"), val = bool(false)]; tensor transpose_146_perm_0 = const()[name = string("transpose_146_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_147_perm_0 = const()[name = string("transpose_147_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_147 = transpose(perm = transpose_147_perm_0, x = var_633_cast_fp16)[name = string("transpose_282")]; tensor transpose_146 = transpose(perm = transpose_146_perm_0, x = mul_19_cast_fp16)[name = string("transpose_283")]; tensor matmul_9_cast_fp16 = matmul(transpose_x = matmul_9_transpose_x_0, transpose_y = matmul_9_transpose_y_0, x = transpose_146, y = transpose_147)[name = string("matmul_9_cast_fp16")]; tensor add_9_cast_fp16 = add(x = matmul_9_cast_fp16, y = mul_0_to_fp16)[name = string("add_9_cast_fp16")]; int32 softmax_9_axis_0 = const()[name = string("softmax_9_axis_0"), val = int32(-1)]; tensor softmax_9_cast_fp16 = softmax(axis = softmax_9_axis_0, x = add_9_cast_fp16)[name = string("softmax_9_cast_fp16")]; bool attn_output_37_transpose_x_0 = const()[name = string("attn_output_37_transpose_x_0"), val = bool(false)]; bool attn_output_37_transpose_y_0 = const()[name = string("attn_output_37_transpose_y_0"), val = bool(false)]; tensor value_19_cast_fp16 = transpose(perm = value_19_perm_0, x = var_636_cast_fp16)[name = string("transpose_281")]; tensor attn_output_37_cast_fp16 = matmul(transpose_x = attn_output_37_transpose_x_0, transpose_y = attn_output_37_transpose_y_0, x = softmax_9_cast_fp16, y = value_19_cast_fp16)[name = string("attn_output_37_cast_fp16")]; tensor var_639_perm_0 = const()[name = string("op_639_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_641 = const()[name = string("op_641"), val = tensor([1, 77, -1])]; tensor var_639_cast_fp16 = transpose(perm = var_639_perm_0, x = attn_output_37_cast_fp16)[name = string("transpose_280")]; tensor var_642_cast_fp16 = reshape(shape = var_641, x = var_639_cast_fp16)[name = string("op_642_cast_fp16")]; tensor encoder_text_model_encoder_layers_9_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(185618944))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(186847808))))[name = string("encoder_text_model_encoder_layers_9_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_9_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_9_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(186858112)))]; tensor linear_57_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_9_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_9_self_attn_out_proj_weight_to_fp16_palettized, x = var_642_cast_fp16)[name = string("linear_57_cast_fp16")]; tensor input_115_cast_fp16 = add(x = input_111_cast_fp16, y = linear_57_cast_fp16)[name = string("input_115_cast_fp16")]; tensor input_117_axes_0 = const()[name = string("input_117_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_9_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_9_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(186860736)))]; tensor encoder_text_model_encoder_layers_9_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_9_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(186863360)))]; tensor input_117_cast_fp16 = layer_norm(axes = input_117_axes_0, beta = encoder_text_model_encoder_layers_9_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_9_layer_norm2_weight_to_fp16, x = input_115_cast_fp16)[name = string("input_117_cast_fp16")]; tensor encoder_text_model_encoder_layers_9_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(186865984))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(191781248))))[name = string("encoder_text_model_encoder_layers_9_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_9_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_9_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(191822272)))]; tensor linear_58_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_9_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_9_mlp_fc1_weight_to_fp16_palettized, x = input_117_cast_fp16)[name = string("linear_58_cast_fp16")]; string input_121_mode_0 = const()[name = string("input_121_mode_0"), val = string("EXACT")]; tensor input_121_cast_fp16 = gelu(mode = input_121_mode_0, x = linear_58_cast_fp16)[name = string("input_121_cast_fp16")]; tensor encoder_text_model_encoder_layers_9_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(191832576))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(196747840))))[name = string("encoder_text_model_encoder_layers_9_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_9_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_9_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(196758144)))]; tensor linear_59_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_9_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_9_mlp_fc2_weight_to_fp16_palettized, x = input_121_cast_fp16)[name = string("linear_59_cast_fp16")]; tensor input_123_cast_fp16 = add(x = input_115_cast_fp16, y = linear_59_cast_fp16)[name = string("input_123_cast_fp16")]; tensor hidden_states_61_axes_0 = const()[name = string("hidden_states_61_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_10_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_10_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(196760768)))]; tensor encoder_text_model_encoder_layers_10_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_10_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(196763392)))]; tensor hidden_states_61_cast_fp16 = layer_norm(axes = hidden_states_61_axes_0, beta = encoder_text_model_encoder_layers_10_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_10_layer_norm1_weight_to_fp16, x = input_123_cast_fp16)[name = string("hidden_states_61_cast_fp16")]; tensor encoder_text_model_encoder_layers_10_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(196766016))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(197994880))))[name = string("encoder_text_model_encoder_layers_10_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_10_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_10_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(198005184)))]; tensor linear_60_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_10_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_10_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_61_cast_fp16)[name = string("linear_60_cast_fp16")]; tensor encoder_text_model_encoder_layers_10_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(198007808))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(199236672))))[name = string("encoder_text_model_encoder_layers_10_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_10_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_10_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(199246976)))]; tensor linear_61_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_10_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_10_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_61_cast_fp16)[name = string("linear_61_cast_fp16")]; tensor encoder_text_model_encoder_layers_10_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(199249600))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(200478464))))[name = string("encoder_text_model_encoder_layers_10_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_10_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_10_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(200488768)))]; tensor linear_62_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_10_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_10_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_61_cast_fp16)[name = string("linear_62_cast_fp16")]; tensor var_685 = const()[name = string("op_685"), val = tensor([1, 77, -1, 64])]; tensor var_686_cast_fp16 = reshape(shape = var_685, x = linear_60_cast_fp16)[name = string("op_686_cast_fp16")]; tensor var_688 = const()[name = string("op_688"), val = tensor([1, 77, -1, 64])]; tensor var_689_cast_fp16 = reshape(shape = var_688, x = linear_61_cast_fp16)[name = string("op_689_cast_fp16")]; tensor var_691 = const()[name = string("op_691"), val = tensor([1, 77, -1, 64])]; tensor var_692_cast_fp16 = reshape(shape = var_691, x = linear_62_cast_fp16)[name = string("op_692_cast_fp16")]; tensor value_21_perm_0 = const()[name = string("value_21_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_21_cast_fp16 = mul(x = var_686_cast_fp16, y = var_11_to_fp16)[name = string("mul_21_cast_fp16")]; bool matmul_10_transpose_y_0 = const()[name = string("matmul_10_transpose_y_0"), val = bool(true)]; bool matmul_10_transpose_x_0 = const()[name = string("matmul_10_transpose_x_0"), val = bool(false)]; tensor transpose_148_perm_0 = const()[name = string("transpose_148_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_149_perm_0 = const()[name = string("transpose_149_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_149 = transpose(perm = transpose_149_perm_0, x = var_689_cast_fp16)[name = string("transpose_278")]; tensor transpose_148 = transpose(perm = transpose_148_perm_0, x = mul_21_cast_fp16)[name = string("transpose_279")]; tensor matmul_10_cast_fp16 = matmul(transpose_x = matmul_10_transpose_x_0, transpose_y = matmul_10_transpose_y_0, x = transpose_148, y = transpose_149)[name = string("matmul_10_cast_fp16")]; tensor add_10_cast_fp16 = add(x = matmul_10_cast_fp16, y = mul_0_to_fp16)[name = string("add_10_cast_fp16")]; int32 softmax_10_axis_0 = const()[name = string("softmax_10_axis_0"), val = int32(-1)]; tensor softmax_10_cast_fp16 = softmax(axis = softmax_10_axis_0, x = add_10_cast_fp16)[name = string("softmax_10_cast_fp16")]; bool attn_output_41_transpose_x_0 = const()[name = string("attn_output_41_transpose_x_0"), val = bool(false)]; bool attn_output_41_transpose_y_0 = const()[name = string("attn_output_41_transpose_y_0"), val = bool(false)]; tensor value_21_cast_fp16 = transpose(perm = value_21_perm_0, x = var_692_cast_fp16)[name = string("transpose_277")]; tensor attn_output_41_cast_fp16 = matmul(transpose_x = attn_output_41_transpose_x_0, transpose_y = attn_output_41_transpose_y_0, x = softmax_10_cast_fp16, y = value_21_cast_fp16)[name = string("attn_output_41_cast_fp16")]; tensor var_695_perm_0 = const()[name = string("op_695_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_697 = const()[name = string("op_697"), val = tensor([1, 77, -1])]; tensor var_695_cast_fp16 = transpose(perm = var_695_perm_0, x = attn_output_41_cast_fp16)[name = string("transpose_276")]; tensor var_698_cast_fp16 = reshape(shape = var_697, x = var_695_cast_fp16)[name = string("op_698_cast_fp16")]; tensor encoder_text_model_encoder_layers_10_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(200491392))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(201720256))))[name = string("encoder_text_model_encoder_layers_10_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_10_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_10_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(201730560)))]; tensor linear_63_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_10_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_10_self_attn_out_proj_weight_to_fp16_palettized, x = var_698_cast_fp16)[name = string("linear_63_cast_fp16")]; tensor input_127_cast_fp16 = add(x = input_123_cast_fp16, y = linear_63_cast_fp16)[name = string("input_127_cast_fp16")]; tensor input_129_axes_0 = const()[name = string("input_129_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_10_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_10_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(201733184)))]; tensor encoder_text_model_encoder_layers_10_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_10_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(201735808)))]; tensor input_129_cast_fp16 = layer_norm(axes = input_129_axes_0, beta = encoder_text_model_encoder_layers_10_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_10_layer_norm2_weight_to_fp16, x = input_127_cast_fp16)[name = string("input_129_cast_fp16")]; tensor encoder_text_model_encoder_layers_10_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(201738432))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(206653696))))[name = string("encoder_text_model_encoder_layers_10_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_10_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_10_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(206694720)))]; tensor linear_64_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_10_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_10_mlp_fc1_weight_to_fp16_palettized, x = input_129_cast_fp16)[name = string("linear_64_cast_fp16")]; string input_133_mode_0 = const()[name = string("input_133_mode_0"), val = string("EXACT")]; tensor input_133_cast_fp16 = gelu(mode = input_133_mode_0, x = linear_64_cast_fp16)[name = string("input_133_cast_fp16")]; tensor encoder_text_model_encoder_layers_10_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(206705024))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(211620288))))[name = string("encoder_text_model_encoder_layers_10_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_10_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_10_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(211630592)))]; tensor linear_65_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_10_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_10_mlp_fc2_weight_to_fp16_palettized, x = input_133_cast_fp16)[name = string("linear_65_cast_fp16")]; tensor input_135_cast_fp16 = add(x = input_127_cast_fp16, y = linear_65_cast_fp16)[name = string("input_135_cast_fp16")]; tensor hidden_states_67_axes_0 = const()[name = string("hidden_states_67_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_11_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_11_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(211633216)))]; tensor encoder_text_model_encoder_layers_11_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_11_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(211635840)))]; tensor hidden_states_67_cast_fp16 = layer_norm(axes = hidden_states_67_axes_0, beta = encoder_text_model_encoder_layers_11_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_11_layer_norm1_weight_to_fp16, x = input_135_cast_fp16)[name = string("hidden_states_67_cast_fp16")]; tensor encoder_text_model_encoder_layers_11_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(211638464))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(212867328))))[name = string("encoder_text_model_encoder_layers_11_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_11_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_11_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(212877632)))]; tensor linear_66_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_11_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_11_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_67_cast_fp16)[name = string("linear_66_cast_fp16")]; tensor encoder_text_model_encoder_layers_11_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(212880256))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(214109120))))[name = string("encoder_text_model_encoder_layers_11_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_11_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_11_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(214119424)))]; tensor linear_67_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_11_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_11_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_67_cast_fp16)[name = string("linear_67_cast_fp16")]; tensor encoder_text_model_encoder_layers_11_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(214122048))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(215350912))))[name = string("encoder_text_model_encoder_layers_11_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_11_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_11_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(215361216)))]; tensor linear_68_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_11_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_11_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_67_cast_fp16)[name = string("linear_68_cast_fp16")]; tensor var_741 = const()[name = string("op_741"), val = tensor([1, 77, -1, 64])]; tensor var_742_cast_fp16 = reshape(shape = var_741, x = linear_66_cast_fp16)[name = string("op_742_cast_fp16")]; tensor var_744 = const()[name = string("op_744"), val = tensor([1, 77, -1, 64])]; tensor var_745_cast_fp16 = reshape(shape = var_744, x = linear_67_cast_fp16)[name = string("op_745_cast_fp16")]; tensor var_747 = const()[name = string("op_747"), val = tensor([1, 77, -1, 64])]; tensor var_748_cast_fp16 = reshape(shape = var_747, x = linear_68_cast_fp16)[name = string("op_748_cast_fp16")]; tensor value_23_perm_0 = const()[name = string("value_23_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_23_cast_fp16 = mul(x = var_742_cast_fp16, y = var_11_to_fp16)[name = string("mul_23_cast_fp16")]; bool matmul_11_transpose_y_0 = const()[name = string("matmul_11_transpose_y_0"), val = bool(true)]; bool matmul_11_transpose_x_0 = const()[name = string("matmul_11_transpose_x_0"), val = bool(false)]; tensor transpose_150_perm_0 = const()[name = string("transpose_150_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_151_perm_0 = const()[name = string("transpose_151_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_151 = transpose(perm = transpose_151_perm_0, x = var_745_cast_fp16)[name = string("transpose_274")]; tensor transpose_150 = transpose(perm = transpose_150_perm_0, x = mul_23_cast_fp16)[name = string("transpose_275")]; tensor matmul_11_cast_fp16 = matmul(transpose_x = matmul_11_transpose_x_0, transpose_y = matmul_11_transpose_y_0, x = transpose_150, y = transpose_151)[name = string("matmul_11_cast_fp16")]; tensor add_11_cast_fp16 = add(x = matmul_11_cast_fp16, y = mul_0_to_fp16)[name = string("add_11_cast_fp16")]; int32 softmax_11_axis_0 = const()[name = string("softmax_11_axis_0"), val = int32(-1)]; tensor softmax_11_cast_fp16 = softmax(axis = softmax_11_axis_0, x = add_11_cast_fp16)[name = string("softmax_11_cast_fp16")]; bool attn_output_45_transpose_x_0 = const()[name = string("attn_output_45_transpose_x_0"), val = bool(false)]; bool attn_output_45_transpose_y_0 = const()[name = string("attn_output_45_transpose_y_0"), val = bool(false)]; tensor value_23_cast_fp16 = transpose(perm = value_23_perm_0, x = var_748_cast_fp16)[name = string("transpose_273")]; tensor attn_output_45_cast_fp16 = matmul(transpose_x = attn_output_45_transpose_x_0, transpose_y = attn_output_45_transpose_y_0, x = softmax_11_cast_fp16, y = value_23_cast_fp16)[name = string("attn_output_45_cast_fp16")]; tensor var_751_perm_0 = const()[name = string("op_751_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_753 = const()[name = string("op_753"), val = tensor([1, 77, -1])]; tensor var_751_cast_fp16 = transpose(perm = var_751_perm_0, x = attn_output_45_cast_fp16)[name = string("transpose_272")]; tensor var_754_cast_fp16 = reshape(shape = var_753, x = var_751_cast_fp16)[name = string("op_754_cast_fp16")]; tensor encoder_text_model_encoder_layers_11_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(215363840))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(216592704))))[name = string("encoder_text_model_encoder_layers_11_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_11_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_11_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(216603008)))]; tensor linear_69_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_11_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_11_self_attn_out_proj_weight_to_fp16_palettized, x = var_754_cast_fp16)[name = string("linear_69_cast_fp16")]; tensor input_139_cast_fp16 = add(x = input_135_cast_fp16, y = linear_69_cast_fp16)[name = string("input_139_cast_fp16")]; tensor input_141_axes_0 = const()[name = string("input_141_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_11_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_11_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(216605632)))]; tensor encoder_text_model_encoder_layers_11_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_11_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(216608256)))]; tensor input_141_cast_fp16 = layer_norm(axes = input_141_axes_0, beta = encoder_text_model_encoder_layers_11_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_11_layer_norm2_weight_to_fp16, x = input_139_cast_fp16)[name = string("input_141_cast_fp16")]; tensor encoder_text_model_encoder_layers_11_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(216610880))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(221526144))))[name = string("encoder_text_model_encoder_layers_11_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_11_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_11_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(221567168)))]; tensor linear_70_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_11_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_11_mlp_fc1_weight_to_fp16_palettized, x = input_141_cast_fp16)[name = string("linear_70_cast_fp16")]; string input_145_mode_0 = const()[name = string("input_145_mode_0"), val = string("EXACT")]; tensor input_145_cast_fp16 = gelu(mode = input_145_mode_0, x = linear_70_cast_fp16)[name = string("input_145_cast_fp16")]; tensor encoder_text_model_encoder_layers_11_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(221577472))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(226492736))))[name = string("encoder_text_model_encoder_layers_11_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_11_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_11_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(226503040)))]; tensor linear_71_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_11_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_11_mlp_fc2_weight_to_fp16_palettized, x = input_145_cast_fp16)[name = string("linear_71_cast_fp16")]; tensor input_147_cast_fp16 = add(x = input_139_cast_fp16, y = linear_71_cast_fp16)[name = string("input_147_cast_fp16")]; tensor hidden_states_73_axes_0 = const()[name = string("hidden_states_73_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_12_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_12_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(226505664)))]; tensor encoder_text_model_encoder_layers_12_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_12_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(226508288)))]; tensor hidden_states_73_cast_fp16 = layer_norm(axes = hidden_states_73_axes_0, beta = encoder_text_model_encoder_layers_12_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_12_layer_norm1_weight_to_fp16, x = input_147_cast_fp16)[name = string("hidden_states_73_cast_fp16")]; tensor encoder_text_model_encoder_layers_12_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(226510912))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(227739776))))[name = string("encoder_text_model_encoder_layers_12_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_12_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_12_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(227750080)))]; tensor linear_72_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_12_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_12_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_73_cast_fp16)[name = string("linear_72_cast_fp16")]; tensor encoder_text_model_encoder_layers_12_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(227752704))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(228981568))))[name = string("encoder_text_model_encoder_layers_12_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_12_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_12_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(228991872)))]; tensor linear_73_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_12_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_12_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_73_cast_fp16)[name = string("linear_73_cast_fp16")]; tensor encoder_text_model_encoder_layers_12_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(228994496))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(230223360))))[name = string("encoder_text_model_encoder_layers_12_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_12_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_12_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(230233664)))]; tensor linear_74_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_12_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_12_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_73_cast_fp16)[name = string("linear_74_cast_fp16")]; tensor var_797 = const()[name = string("op_797"), val = tensor([1, 77, -1, 64])]; tensor var_798_cast_fp16 = reshape(shape = var_797, x = linear_72_cast_fp16)[name = string("op_798_cast_fp16")]; tensor var_800 = const()[name = string("op_800"), val = tensor([1, 77, -1, 64])]; tensor var_801_cast_fp16 = reshape(shape = var_800, x = linear_73_cast_fp16)[name = string("op_801_cast_fp16")]; tensor var_803 = const()[name = string("op_803"), val = tensor([1, 77, -1, 64])]; tensor var_804_cast_fp16 = reshape(shape = var_803, x = linear_74_cast_fp16)[name = string("op_804_cast_fp16")]; tensor value_25_perm_0 = const()[name = string("value_25_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_25_cast_fp16 = mul(x = var_798_cast_fp16, y = var_11_to_fp16)[name = string("mul_25_cast_fp16")]; bool matmul_12_transpose_y_0 = const()[name = string("matmul_12_transpose_y_0"), val = bool(true)]; bool matmul_12_transpose_x_0 = const()[name = string("matmul_12_transpose_x_0"), val = bool(false)]; tensor transpose_152_perm_0 = const()[name = string("transpose_152_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_153_perm_0 = const()[name = string("transpose_153_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_153 = transpose(perm = transpose_153_perm_0, x = var_801_cast_fp16)[name = string("transpose_270")]; tensor transpose_152 = transpose(perm = transpose_152_perm_0, x = mul_25_cast_fp16)[name = string("transpose_271")]; tensor matmul_12_cast_fp16 = matmul(transpose_x = matmul_12_transpose_x_0, transpose_y = matmul_12_transpose_y_0, x = transpose_152, y = transpose_153)[name = string("matmul_12_cast_fp16")]; tensor add_12_cast_fp16 = add(x = matmul_12_cast_fp16, y = mul_0_to_fp16)[name = string("add_12_cast_fp16")]; int32 softmax_12_axis_0 = const()[name = string("softmax_12_axis_0"), val = int32(-1)]; tensor softmax_12_cast_fp16 = softmax(axis = softmax_12_axis_0, x = add_12_cast_fp16)[name = string("softmax_12_cast_fp16")]; bool attn_output_49_transpose_x_0 = const()[name = string("attn_output_49_transpose_x_0"), val = bool(false)]; bool attn_output_49_transpose_y_0 = const()[name = string("attn_output_49_transpose_y_0"), val = bool(false)]; tensor value_25_cast_fp16 = transpose(perm = value_25_perm_0, x = var_804_cast_fp16)[name = string("transpose_269")]; tensor attn_output_49_cast_fp16 = matmul(transpose_x = attn_output_49_transpose_x_0, transpose_y = attn_output_49_transpose_y_0, x = softmax_12_cast_fp16, y = value_25_cast_fp16)[name = string("attn_output_49_cast_fp16")]; tensor var_807_perm_0 = const()[name = string("op_807_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_809 = const()[name = string("op_809"), val = tensor([1, 77, -1])]; tensor var_807_cast_fp16 = transpose(perm = var_807_perm_0, x = attn_output_49_cast_fp16)[name = string("transpose_268")]; tensor var_810_cast_fp16 = reshape(shape = var_809, x = var_807_cast_fp16)[name = string("op_810_cast_fp16")]; tensor encoder_text_model_encoder_layers_12_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(230236288))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(231465152))))[name = string("encoder_text_model_encoder_layers_12_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_12_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_12_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(231475456)))]; tensor linear_75_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_12_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_12_self_attn_out_proj_weight_to_fp16_palettized, x = var_810_cast_fp16)[name = string("linear_75_cast_fp16")]; tensor input_151_cast_fp16 = add(x = input_147_cast_fp16, y = linear_75_cast_fp16)[name = string("input_151_cast_fp16")]; tensor input_153_axes_0 = const()[name = string("input_153_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_12_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_12_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(231478080)))]; tensor encoder_text_model_encoder_layers_12_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_12_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(231480704)))]; tensor input_153_cast_fp16 = layer_norm(axes = input_153_axes_0, beta = encoder_text_model_encoder_layers_12_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_12_layer_norm2_weight_to_fp16, x = input_151_cast_fp16)[name = string("input_153_cast_fp16")]; tensor encoder_text_model_encoder_layers_12_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(231483328))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(236398592))))[name = string("encoder_text_model_encoder_layers_12_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_12_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_12_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(236439616)))]; tensor linear_76_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_12_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_12_mlp_fc1_weight_to_fp16_palettized, x = input_153_cast_fp16)[name = string("linear_76_cast_fp16")]; string input_157_mode_0 = const()[name = string("input_157_mode_0"), val = string("EXACT")]; tensor input_157_cast_fp16 = gelu(mode = input_157_mode_0, x = linear_76_cast_fp16)[name = string("input_157_cast_fp16")]; tensor encoder_text_model_encoder_layers_12_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(236449920))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(241365184))))[name = string("encoder_text_model_encoder_layers_12_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_12_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_12_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(241375488)))]; tensor linear_77_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_12_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_12_mlp_fc2_weight_to_fp16_palettized, x = input_157_cast_fp16)[name = string("linear_77_cast_fp16")]; tensor input_159_cast_fp16 = add(x = input_151_cast_fp16, y = linear_77_cast_fp16)[name = string("input_159_cast_fp16")]; tensor hidden_states_79_axes_0 = const()[name = string("hidden_states_79_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_13_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_13_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(241378112)))]; tensor encoder_text_model_encoder_layers_13_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_13_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(241380736)))]; tensor hidden_states_79_cast_fp16 = layer_norm(axes = hidden_states_79_axes_0, beta = encoder_text_model_encoder_layers_13_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_13_layer_norm1_weight_to_fp16, x = input_159_cast_fp16)[name = string("hidden_states_79_cast_fp16")]; tensor encoder_text_model_encoder_layers_13_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(241383360))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(242612224))))[name = string("encoder_text_model_encoder_layers_13_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_13_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_13_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(242622528)))]; tensor linear_78_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_13_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_13_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_79_cast_fp16)[name = string("linear_78_cast_fp16")]; tensor encoder_text_model_encoder_layers_13_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(242625152))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(243854016))))[name = string("encoder_text_model_encoder_layers_13_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_13_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_13_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(243864320)))]; tensor linear_79_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_13_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_13_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_79_cast_fp16)[name = string("linear_79_cast_fp16")]; tensor encoder_text_model_encoder_layers_13_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(243866944))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(245095808))))[name = string("encoder_text_model_encoder_layers_13_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_13_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_13_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(245106112)))]; tensor linear_80_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_13_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_13_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_79_cast_fp16)[name = string("linear_80_cast_fp16")]; tensor var_853 = const()[name = string("op_853"), val = tensor([1, 77, -1, 64])]; tensor var_854_cast_fp16 = reshape(shape = var_853, x = linear_78_cast_fp16)[name = string("op_854_cast_fp16")]; tensor var_856 = const()[name = string("op_856"), val = tensor([1, 77, -1, 64])]; tensor var_857_cast_fp16 = reshape(shape = var_856, x = linear_79_cast_fp16)[name = string("op_857_cast_fp16")]; tensor var_859 = const()[name = string("op_859"), val = tensor([1, 77, -1, 64])]; tensor var_860_cast_fp16 = reshape(shape = var_859, x = linear_80_cast_fp16)[name = string("op_860_cast_fp16")]; tensor value_27_perm_0 = const()[name = string("value_27_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_27_cast_fp16 = mul(x = var_854_cast_fp16, y = var_11_to_fp16)[name = string("mul_27_cast_fp16")]; bool matmul_13_transpose_y_0 = const()[name = string("matmul_13_transpose_y_0"), val = bool(true)]; bool matmul_13_transpose_x_0 = const()[name = string("matmul_13_transpose_x_0"), val = bool(false)]; tensor transpose_154_perm_0 = const()[name = string("transpose_154_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_155_perm_0 = const()[name = string("transpose_155_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_155 = transpose(perm = transpose_155_perm_0, x = var_857_cast_fp16)[name = string("transpose_266")]; tensor transpose_154 = transpose(perm = transpose_154_perm_0, x = mul_27_cast_fp16)[name = string("transpose_267")]; tensor matmul_13_cast_fp16 = matmul(transpose_x = matmul_13_transpose_x_0, transpose_y = matmul_13_transpose_y_0, x = transpose_154, y = transpose_155)[name = string("matmul_13_cast_fp16")]; tensor add_13_cast_fp16 = add(x = matmul_13_cast_fp16, y = mul_0_to_fp16)[name = string("add_13_cast_fp16")]; int32 softmax_13_axis_0 = const()[name = string("softmax_13_axis_0"), val = int32(-1)]; tensor softmax_13_cast_fp16 = softmax(axis = softmax_13_axis_0, x = add_13_cast_fp16)[name = string("softmax_13_cast_fp16")]; bool attn_output_53_transpose_x_0 = const()[name = string("attn_output_53_transpose_x_0"), val = bool(false)]; bool attn_output_53_transpose_y_0 = const()[name = string("attn_output_53_transpose_y_0"), val = bool(false)]; tensor value_27_cast_fp16 = transpose(perm = value_27_perm_0, x = var_860_cast_fp16)[name = string("transpose_265")]; tensor attn_output_53_cast_fp16 = matmul(transpose_x = attn_output_53_transpose_x_0, transpose_y = attn_output_53_transpose_y_0, x = softmax_13_cast_fp16, y = value_27_cast_fp16)[name = string("attn_output_53_cast_fp16")]; tensor var_863_perm_0 = const()[name = string("op_863_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_865 = const()[name = string("op_865"), val = tensor([1, 77, -1])]; tensor var_863_cast_fp16 = transpose(perm = var_863_perm_0, x = attn_output_53_cast_fp16)[name = string("transpose_264")]; tensor var_866_cast_fp16 = reshape(shape = var_865, x = var_863_cast_fp16)[name = string("op_866_cast_fp16")]; tensor encoder_text_model_encoder_layers_13_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(245108736))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(246337600))))[name = string("encoder_text_model_encoder_layers_13_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_13_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_13_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(246347904)))]; tensor linear_81_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_13_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_13_self_attn_out_proj_weight_to_fp16_palettized, x = var_866_cast_fp16)[name = string("linear_81_cast_fp16")]; tensor input_163_cast_fp16 = add(x = input_159_cast_fp16, y = linear_81_cast_fp16)[name = string("input_163_cast_fp16")]; tensor input_165_axes_0 = const()[name = string("input_165_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_13_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_13_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(246350528)))]; tensor encoder_text_model_encoder_layers_13_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_13_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(246353152)))]; tensor input_165_cast_fp16 = layer_norm(axes = input_165_axes_0, beta = encoder_text_model_encoder_layers_13_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_13_layer_norm2_weight_to_fp16, x = input_163_cast_fp16)[name = string("input_165_cast_fp16")]; tensor encoder_text_model_encoder_layers_13_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(246355776))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(251271040))))[name = string("encoder_text_model_encoder_layers_13_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_13_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_13_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(251312064)))]; tensor linear_82_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_13_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_13_mlp_fc1_weight_to_fp16_palettized, x = input_165_cast_fp16)[name = string("linear_82_cast_fp16")]; string input_169_mode_0 = const()[name = string("input_169_mode_0"), val = string("EXACT")]; tensor input_169_cast_fp16 = gelu(mode = input_169_mode_0, x = linear_82_cast_fp16)[name = string("input_169_cast_fp16")]; tensor encoder_text_model_encoder_layers_13_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(251322368))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(256237632))))[name = string("encoder_text_model_encoder_layers_13_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_13_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_13_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(256247936)))]; tensor linear_83_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_13_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_13_mlp_fc2_weight_to_fp16_palettized, x = input_169_cast_fp16)[name = string("linear_83_cast_fp16")]; tensor input_171_cast_fp16 = add(x = input_163_cast_fp16, y = linear_83_cast_fp16)[name = string("input_171_cast_fp16")]; tensor hidden_states_85_axes_0 = const()[name = string("hidden_states_85_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_14_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_14_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(256250560)))]; tensor encoder_text_model_encoder_layers_14_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_14_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(256253184)))]; tensor hidden_states_85_cast_fp16 = layer_norm(axes = hidden_states_85_axes_0, beta = encoder_text_model_encoder_layers_14_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_14_layer_norm1_weight_to_fp16, x = input_171_cast_fp16)[name = string("hidden_states_85_cast_fp16")]; tensor encoder_text_model_encoder_layers_14_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(256255808))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(257484672))))[name = string("encoder_text_model_encoder_layers_14_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_14_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_14_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(257494976)))]; tensor linear_84_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_14_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_14_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_85_cast_fp16)[name = string("linear_84_cast_fp16")]; tensor encoder_text_model_encoder_layers_14_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(257497600))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(258726464))))[name = string("encoder_text_model_encoder_layers_14_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_14_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_14_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(258736768)))]; tensor linear_85_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_14_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_14_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_85_cast_fp16)[name = string("linear_85_cast_fp16")]; tensor encoder_text_model_encoder_layers_14_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(258739392))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(259968256))))[name = string("encoder_text_model_encoder_layers_14_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_14_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_14_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(259978560)))]; tensor linear_86_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_14_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_14_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_85_cast_fp16)[name = string("linear_86_cast_fp16")]; tensor var_909 = const()[name = string("op_909"), val = tensor([1, 77, -1, 64])]; tensor var_910_cast_fp16 = reshape(shape = var_909, x = linear_84_cast_fp16)[name = string("op_910_cast_fp16")]; tensor var_912 = const()[name = string("op_912"), val = tensor([1, 77, -1, 64])]; tensor var_913_cast_fp16 = reshape(shape = var_912, x = linear_85_cast_fp16)[name = string("op_913_cast_fp16")]; tensor var_915 = const()[name = string("op_915"), val = tensor([1, 77, -1, 64])]; tensor var_916_cast_fp16 = reshape(shape = var_915, x = linear_86_cast_fp16)[name = string("op_916_cast_fp16")]; tensor value_29_perm_0 = const()[name = string("value_29_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_29_cast_fp16 = mul(x = var_910_cast_fp16, y = var_11_to_fp16)[name = string("mul_29_cast_fp16")]; bool matmul_14_transpose_y_0 = const()[name = string("matmul_14_transpose_y_0"), val = bool(true)]; bool matmul_14_transpose_x_0 = const()[name = string("matmul_14_transpose_x_0"), val = bool(false)]; tensor transpose_156_perm_0 = const()[name = string("transpose_156_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_157_perm_0 = const()[name = string("transpose_157_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_157 = transpose(perm = transpose_157_perm_0, x = var_913_cast_fp16)[name = string("transpose_262")]; tensor transpose_156 = transpose(perm = transpose_156_perm_0, x = mul_29_cast_fp16)[name = string("transpose_263")]; tensor matmul_14_cast_fp16 = matmul(transpose_x = matmul_14_transpose_x_0, transpose_y = matmul_14_transpose_y_0, x = transpose_156, y = transpose_157)[name = string("matmul_14_cast_fp16")]; tensor add_14_cast_fp16 = add(x = matmul_14_cast_fp16, y = mul_0_to_fp16)[name = string("add_14_cast_fp16")]; int32 softmax_14_axis_0 = const()[name = string("softmax_14_axis_0"), val = int32(-1)]; tensor softmax_14_cast_fp16 = softmax(axis = softmax_14_axis_0, x = add_14_cast_fp16)[name = string("softmax_14_cast_fp16")]; bool attn_output_57_transpose_x_0 = const()[name = string("attn_output_57_transpose_x_0"), val = bool(false)]; bool attn_output_57_transpose_y_0 = const()[name = string("attn_output_57_transpose_y_0"), val = bool(false)]; tensor value_29_cast_fp16 = transpose(perm = value_29_perm_0, x = var_916_cast_fp16)[name = string("transpose_261")]; tensor attn_output_57_cast_fp16 = matmul(transpose_x = attn_output_57_transpose_x_0, transpose_y = attn_output_57_transpose_y_0, x = softmax_14_cast_fp16, y = value_29_cast_fp16)[name = string("attn_output_57_cast_fp16")]; tensor var_919_perm_0 = const()[name = string("op_919_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_921 = const()[name = string("op_921"), val = tensor([1, 77, -1])]; tensor var_919_cast_fp16 = transpose(perm = var_919_perm_0, x = attn_output_57_cast_fp16)[name = string("transpose_260")]; tensor var_922_cast_fp16 = reshape(shape = var_921, x = var_919_cast_fp16)[name = string("op_922_cast_fp16")]; tensor encoder_text_model_encoder_layers_14_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(259981184))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(261210048))))[name = string("encoder_text_model_encoder_layers_14_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_14_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_14_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(261220352)))]; tensor linear_87_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_14_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_14_self_attn_out_proj_weight_to_fp16_palettized, x = var_922_cast_fp16)[name = string("linear_87_cast_fp16")]; tensor input_175_cast_fp16 = add(x = input_171_cast_fp16, y = linear_87_cast_fp16)[name = string("input_175_cast_fp16")]; tensor input_177_axes_0 = const()[name = string("input_177_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_14_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_14_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(261222976)))]; tensor encoder_text_model_encoder_layers_14_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_14_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(261225600)))]; tensor input_177_cast_fp16 = layer_norm(axes = input_177_axes_0, beta = encoder_text_model_encoder_layers_14_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_14_layer_norm2_weight_to_fp16, x = input_175_cast_fp16)[name = string("input_177_cast_fp16")]; tensor encoder_text_model_encoder_layers_14_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(261228224))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(266143488))))[name = string("encoder_text_model_encoder_layers_14_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_14_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_14_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(266184512)))]; tensor linear_88_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_14_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_14_mlp_fc1_weight_to_fp16_palettized, x = input_177_cast_fp16)[name = string("linear_88_cast_fp16")]; string input_181_mode_0 = const()[name = string("input_181_mode_0"), val = string("EXACT")]; tensor input_181_cast_fp16 = gelu(mode = input_181_mode_0, x = linear_88_cast_fp16)[name = string("input_181_cast_fp16")]; tensor encoder_text_model_encoder_layers_14_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(266194816))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(271110080))))[name = string("encoder_text_model_encoder_layers_14_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_14_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_14_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(271120384)))]; tensor linear_89_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_14_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_14_mlp_fc2_weight_to_fp16_palettized, x = input_181_cast_fp16)[name = string("linear_89_cast_fp16")]; tensor input_183_cast_fp16 = add(x = input_175_cast_fp16, y = linear_89_cast_fp16)[name = string("input_183_cast_fp16")]; tensor hidden_states_91_axes_0 = const()[name = string("hidden_states_91_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_15_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_15_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(271123008)))]; tensor encoder_text_model_encoder_layers_15_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_15_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(271125632)))]; tensor hidden_states_91_cast_fp16 = layer_norm(axes = hidden_states_91_axes_0, beta = encoder_text_model_encoder_layers_15_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_15_layer_norm1_weight_to_fp16, x = input_183_cast_fp16)[name = string("hidden_states_91_cast_fp16")]; tensor encoder_text_model_encoder_layers_15_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(271128256))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(272357120))))[name = string("encoder_text_model_encoder_layers_15_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_15_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_15_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(272367424)))]; tensor linear_90_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_15_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_15_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_91_cast_fp16)[name = string("linear_90_cast_fp16")]; tensor encoder_text_model_encoder_layers_15_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(272370048))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(273598912))))[name = string("encoder_text_model_encoder_layers_15_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_15_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_15_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(273609216)))]; tensor linear_91_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_15_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_15_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_91_cast_fp16)[name = string("linear_91_cast_fp16")]; tensor encoder_text_model_encoder_layers_15_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(273611840))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(274840704))))[name = string("encoder_text_model_encoder_layers_15_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_15_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_15_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(274851008)))]; tensor linear_92_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_15_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_15_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_91_cast_fp16)[name = string("linear_92_cast_fp16")]; tensor var_965 = const()[name = string("op_965"), val = tensor([1, 77, -1, 64])]; tensor var_966_cast_fp16 = reshape(shape = var_965, x = linear_90_cast_fp16)[name = string("op_966_cast_fp16")]; tensor var_968 = const()[name = string("op_968"), val = tensor([1, 77, -1, 64])]; tensor var_969_cast_fp16 = reshape(shape = var_968, x = linear_91_cast_fp16)[name = string("op_969_cast_fp16")]; tensor var_971 = const()[name = string("op_971"), val = tensor([1, 77, -1, 64])]; tensor var_972_cast_fp16 = reshape(shape = var_971, x = linear_92_cast_fp16)[name = string("op_972_cast_fp16")]; tensor value_31_perm_0 = const()[name = string("value_31_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_31_cast_fp16 = mul(x = var_966_cast_fp16, y = var_11_to_fp16)[name = string("mul_31_cast_fp16")]; bool matmul_15_transpose_y_0 = const()[name = string("matmul_15_transpose_y_0"), val = bool(true)]; bool matmul_15_transpose_x_0 = const()[name = string("matmul_15_transpose_x_0"), val = bool(false)]; tensor transpose_158_perm_0 = const()[name = string("transpose_158_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_159_perm_0 = const()[name = string("transpose_159_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_159 = transpose(perm = transpose_159_perm_0, x = var_969_cast_fp16)[name = string("transpose_258")]; tensor transpose_158 = transpose(perm = transpose_158_perm_0, x = mul_31_cast_fp16)[name = string("transpose_259")]; tensor matmul_15_cast_fp16 = matmul(transpose_x = matmul_15_transpose_x_0, transpose_y = matmul_15_transpose_y_0, x = transpose_158, y = transpose_159)[name = string("matmul_15_cast_fp16")]; tensor add_15_cast_fp16 = add(x = matmul_15_cast_fp16, y = mul_0_to_fp16)[name = string("add_15_cast_fp16")]; int32 softmax_15_axis_0 = const()[name = string("softmax_15_axis_0"), val = int32(-1)]; tensor softmax_15_cast_fp16 = softmax(axis = softmax_15_axis_0, x = add_15_cast_fp16)[name = string("softmax_15_cast_fp16")]; bool attn_output_61_transpose_x_0 = const()[name = string("attn_output_61_transpose_x_0"), val = bool(false)]; bool attn_output_61_transpose_y_0 = const()[name = string("attn_output_61_transpose_y_0"), val = bool(false)]; tensor value_31_cast_fp16 = transpose(perm = value_31_perm_0, x = var_972_cast_fp16)[name = string("transpose_257")]; tensor attn_output_61_cast_fp16 = matmul(transpose_x = attn_output_61_transpose_x_0, transpose_y = attn_output_61_transpose_y_0, x = softmax_15_cast_fp16, y = value_31_cast_fp16)[name = string("attn_output_61_cast_fp16")]; tensor var_975_perm_0 = const()[name = string("op_975_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_977 = const()[name = string("op_977"), val = tensor([1, 77, -1])]; tensor var_975_cast_fp16 = transpose(perm = var_975_perm_0, x = attn_output_61_cast_fp16)[name = string("transpose_256")]; tensor var_978_cast_fp16 = reshape(shape = var_977, x = var_975_cast_fp16)[name = string("op_978_cast_fp16")]; tensor encoder_text_model_encoder_layers_15_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(274853632))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(276082496))))[name = string("encoder_text_model_encoder_layers_15_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_15_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_15_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(276092800)))]; tensor linear_93_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_15_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_15_self_attn_out_proj_weight_to_fp16_palettized, x = var_978_cast_fp16)[name = string("linear_93_cast_fp16")]; tensor input_187_cast_fp16 = add(x = input_183_cast_fp16, y = linear_93_cast_fp16)[name = string("input_187_cast_fp16")]; tensor input_189_axes_0 = const()[name = string("input_189_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_15_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_15_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(276095424)))]; tensor encoder_text_model_encoder_layers_15_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_15_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(276098048)))]; tensor input_189_cast_fp16 = layer_norm(axes = input_189_axes_0, beta = encoder_text_model_encoder_layers_15_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_15_layer_norm2_weight_to_fp16, x = input_187_cast_fp16)[name = string("input_189_cast_fp16")]; tensor encoder_text_model_encoder_layers_15_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(276100672))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(281015936))))[name = string("encoder_text_model_encoder_layers_15_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_15_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_15_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(281056960)))]; tensor linear_94_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_15_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_15_mlp_fc1_weight_to_fp16_palettized, x = input_189_cast_fp16)[name = string("linear_94_cast_fp16")]; string input_193_mode_0 = const()[name = string("input_193_mode_0"), val = string("EXACT")]; tensor input_193_cast_fp16 = gelu(mode = input_193_mode_0, x = linear_94_cast_fp16)[name = string("input_193_cast_fp16")]; tensor encoder_text_model_encoder_layers_15_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(281067264))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(285982528))))[name = string("encoder_text_model_encoder_layers_15_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_15_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_15_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(285992832)))]; tensor linear_95_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_15_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_15_mlp_fc2_weight_to_fp16_palettized, x = input_193_cast_fp16)[name = string("linear_95_cast_fp16")]; tensor input_195_cast_fp16 = add(x = input_187_cast_fp16, y = linear_95_cast_fp16)[name = string("input_195_cast_fp16")]; tensor hidden_states_97_axes_0 = const()[name = string("hidden_states_97_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_16_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_16_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(285995456)))]; tensor encoder_text_model_encoder_layers_16_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_16_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(285998080)))]; tensor hidden_states_97_cast_fp16 = layer_norm(axes = hidden_states_97_axes_0, beta = encoder_text_model_encoder_layers_16_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_16_layer_norm1_weight_to_fp16, x = input_195_cast_fp16)[name = string("hidden_states_97_cast_fp16")]; tensor encoder_text_model_encoder_layers_16_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(286000704))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(287229568))))[name = string("encoder_text_model_encoder_layers_16_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_16_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_16_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(287239872)))]; tensor linear_96_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_16_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_16_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_97_cast_fp16)[name = string("linear_96_cast_fp16")]; tensor encoder_text_model_encoder_layers_16_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(287242496))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(288471360))))[name = string("encoder_text_model_encoder_layers_16_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_16_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_16_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(288481664)))]; tensor linear_97_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_16_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_16_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_97_cast_fp16)[name = string("linear_97_cast_fp16")]; tensor encoder_text_model_encoder_layers_16_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(288484288))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(289713152))))[name = string("encoder_text_model_encoder_layers_16_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_16_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_16_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(289723456)))]; tensor linear_98_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_16_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_16_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_97_cast_fp16)[name = string("linear_98_cast_fp16")]; tensor var_1021 = const()[name = string("op_1021"), val = tensor([1, 77, -1, 64])]; tensor var_1022_cast_fp16 = reshape(shape = var_1021, x = linear_96_cast_fp16)[name = string("op_1022_cast_fp16")]; tensor var_1024 = const()[name = string("op_1024"), val = tensor([1, 77, -1, 64])]; tensor var_1025_cast_fp16 = reshape(shape = var_1024, x = linear_97_cast_fp16)[name = string("op_1025_cast_fp16")]; tensor var_1027 = const()[name = string("op_1027"), val = tensor([1, 77, -1, 64])]; tensor var_1028_cast_fp16 = reshape(shape = var_1027, x = linear_98_cast_fp16)[name = string("op_1028_cast_fp16")]; tensor value_33_perm_0 = const()[name = string("value_33_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_33_cast_fp16 = mul(x = var_1022_cast_fp16, y = var_11_to_fp16)[name = string("mul_33_cast_fp16")]; bool matmul_16_transpose_y_0 = const()[name = string("matmul_16_transpose_y_0"), val = bool(true)]; bool matmul_16_transpose_x_0 = const()[name = string("matmul_16_transpose_x_0"), val = bool(false)]; tensor transpose_160_perm_0 = const()[name = string("transpose_160_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_161_perm_0 = const()[name = string("transpose_161_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_161 = transpose(perm = transpose_161_perm_0, x = var_1025_cast_fp16)[name = string("transpose_254")]; tensor transpose_160 = transpose(perm = transpose_160_perm_0, x = mul_33_cast_fp16)[name = string("transpose_255")]; tensor matmul_16_cast_fp16 = matmul(transpose_x = matmul_16_transpose_x_0, transpose_y = matmul_16_transpose_y_0, x = transpose_160, y = transpose_161)[name = string("matmul_16_cast_fp16")]; tensor add_16_cast_fp16 = add(x = matmul_16_cast_fp16, y = mul_0_to_fp16)[name = string("add_16_cast_fp16")]; int32 softmax_16_axis_0 = const()[name = string("softmax_16_axis_0"), val = int32(-1)]; tensor softmax_16_cast_fp16 = softmax(axis = softmax_16_axis_0, x = add_16_cast_fp16)[name = string("softmax_16_cast_fp16")]; bool attn_output_65_transpose_x_0 = const()[name = string("attn_output_65_transpose_x_0"), val = bool(false)]; bool attn_output_65_transpose_y_0 = const()[name = string("attn_output_65_transpose_y_0"), val = bool(false)]; tensor value_33_cast_fp16 = transpose(perm = value_33_perm_0, x = var_1028_cast_fp16)[name = string("transpose_253")]; tensor attn_output_65_cast_fp16 = matmul(transpose_x = attn_output_65_transpose_x_0, transpose_y = attn_output_65_transpose_y_0, x = softmax_16_cast_fp16, y = value_33_cast_fp16)[name = string("attn_output_65_cast_fp16")]; tensor var_1031_perm_0 = const()[name = string("op_1031_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1033 = const()[name = string("op_1033"), val = tensor([1, 77, -1])]; tensor var_1031_cast_fp16 = transpose(perm = var_1031_perm_0, x = attn_output_65_cast_fp16)[name = string("transpose_252")]; tensor var_1034_cast_fp16 = reshape(shape = var_1033, x = var_1031_cast_fp16)[name = string("op_1034_cast_fp16")]; tensor encoder_text_model_encoder_layers_16_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(289726080))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(290954944))))[name = string("encoder_text_model_encoder_layers_16_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_16_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_16_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(290965248)))]; tensor linear_99_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_16_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_16_self_attn_out_proj_weight_to_fp16_palettized, x = var_1034_cast_fp16)[name = string("linear_99_cast_fp16")]; tensor input_199_cast_fp16 = add(x = input_195_cast_fp16, y = linear_99_cast_fp16)[name = string("input_199_cast_fp16")]; tensor input_201_axes_0 = const()[name = string("input_201_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_16_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_16_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(290967872)))]; tensor encoder_text_model_encoder_layers_16_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_16_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(290970496)))]; tensor input_201_cast_fp16 = layer_norm(axes = input_201_axes_0, beta = encoder_text_model_encoder_layers_16_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_16_layer_norm2_weight_to_fp16, x = input_199_cast_fp16)[name = string("input_201_cast_fp16")]; tensor encoder_text_model_encoder_layers_16_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(290973120))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(295888384))))[name = string("encoder_text_model_encoder_layers_16_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_16_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_16_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(295929408)))]; tensor linear_100_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_16_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_16_mlp_fc1_weight_to_fp16_palettized, x = input_201_cast_fp16)[name = string("linear_100_cast_fp16")]; string input_205_mode_0 = const()[name = string("input_205_mode_0"), val = string("EXACT")]; tensor input_205_cast_fp16 = gelu(mode = input_205_mode_0, x = linear_100_cast_fp16)[name = string("input_205_cast_fp16")]; tensor encoder_text_model_encoder_layers_16_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(295939712))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(300854976))))[name = string("encoder_text_model_encoder_layers_16_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_16_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_16_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(300865280)))]; tensor linear_101_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_16_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_16_mlp_fc2_weight_to_fp16_palettized, x = input_205_cast_fp16)[name = string("linear_101_cast_fp16")]; tensor input_207_cast_fp16 = add(x = input_199_cast_fp16, y = linear_101_cast_fp16)[name = string("input_207_cast_fp16")]; tensor hidden_states_103_axes_0 = const()[name = string("hidden_states_103_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_17_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_17_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(300867904)))]; tensor encoder_text_model_encoder_layers_17_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_17_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(300870528)))]; tensor hidden_states_103_cast_fp16 = layer_norm(axes = hidden_states_103_axes_0, beta = encoder_text_model_encoder_layers_17_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_17_layer_norm1_weight_to_fp16, x = input_207_cast_fp16)[name = string("hidden_states_103_cast_fp16")]; tensor encoder_text_model_encoder_layers_17_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(300873152))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(302102016))))[name = string("encoder_text_model_encoder_layers_17_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_17_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_17_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(302112320)))]; tensor linear_102_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_17_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_17_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_103_cast_fp16)[name = string("linear_102_cast_fp16")]; tensor encoder_text_model_encoder_layers_17_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(302114944))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(303343808))))[name = string("encoder_text_model_encoder_layers_17_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_17_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_17_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(303354112)))]; tensor linear_103_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_17_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_17_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_103_cast_fp16)[name = string("linear_103_cast_fp16")]; tensor encoder_text_model_encoder_layers_17_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(303356736))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(304585600))))[name = string("encoder_text_model_encoder_layers_17_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_17_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_17_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(304595904)))]; tensor linear_104_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_17_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_17_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_103_cast_fp16)[name = string("linear_104_cast_fp16")]; tensor var_1077 = const()[name = string("op_1077"), val = tensor([1, 77, -1, 64])]; tensor var_1078_cast_fp16 = reshape(shape = var_1077, x = linear_102_cast_fp16)[name = string("op_1078_cast_fp16")]; tensor var_1080 = const()[name = string("op_1080"), val = tensor([1, 77, -1, 64])]; tensor var_1081_cast_fp16 = reshape(shape = var_1080, x = linear_103_cast_fp16)[name = string("op_1081_cast_fp16")]; tensor var_1083 = const()[name = string("op_1083"), val = tensor([1, 77, -1, 64])]; tensor var_1084_cast_fp16 = reshape(shape = var_1083, x = linear_104_cast_fp16)[name = string("op_1084_cast_fp16")]; tensor value_35_perm_0 = const()[name = string("value_35_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_35_cast_fp16 = mul(x = var_1078_cast_fp16, y = var_11_to_fp16)[name = string("mul_35_cast_fp16")]; bool matmul_17_transpose_y_0 = const()[name = string("matmul_17_transpose_y_0"), val = bool(true)]; bool matmul_17_transpose_x_0 = const()[name = string("matmul_17_transpose_x_0"), val = bool(false)]; tensor transpose_162_perm_0 = const()[name = string("transpose_162_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_163_perm_0 = const()[name = string("transpose_163_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_163 = transpose(perm = transpose_163_perm_0, x = var_1081_cast_fp16)[name = string("transpose_250")]; tensor transpose_162 = transpose(perm = transpose_162_perm_0, x = mul_35_cast_fp16)[name = string("transpose_251")]; tensor matmul_17_cast_fp16 = matmul(transpose_x = matmul_17_transpose_x_0, transpose_y = matmul_17_transpose_y_0, x = transpose_162, y = transpose_163)[name = string("matmul_17_cast_fp16")]; tensor add_17_cast_fp16 = add(x = matmul_17_cast_fp16, y = mul_0_to_fp16)[name = string("add_17_cast_fp16")]; int32 softmax_17_axis_0 = const()[name = string("softmax_17_axis_0"), val = int32(-1)]; tensor softmax_17_cast_fp16 = softmax(axis = softmax_17_axis_0, x = add_17_cast_fp16)[name = string("softmax_17_cast_fp16")]; bool attn_output_69_transpose_x_0 = const()[name = string("attn_output_69_transpose_x_0"), val = bool(false)]; bool attn_output_69_transpose_y_0 = const()[name = string("attn_output_69_transpose_y_0"), val = bool(false)]; tensor value_35_cast_fp16 = transpose(perm = value_35_perm_0, x = var_1084_cast_fp16)[name = string("transpose_249")]; tensor attn_output_69_cast_fp16 = matmul(transpose_x = attn_output_69_transpose_x_0, transpose_y = attn_output_69_transpose_y_0, x = softmax_17_cast_fp16, y = value_35_cast_fp16)[name = string("attn_output_69_cast_fp16")]; tensor var_1087_perm_0 = const()[name = string("op_1087_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1089 = const()[name = string("op_1089"), val = tensor([1, 77, -1])]; tensor var_1087_cast_fp16 = transpose(perm = var_1087_perm_0, x = attn_output_69_cast_fp16)[name = string("transpose_248")]; tensor var_1090_cast_fp16 = reshape(shape = var_1089, x = var_1087_cast_fp16)[name = string("op_1090_cast_fp16")]; tensor encoder_text_model_encoder_layers_17_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(304598528))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(305827392))))[name = string("encoder_text_model_encoder_layers_17_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_17_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_17_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(305837696)))]; tensor linear_105_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_17_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_17_self_attn_out_proj_weight_to_fp16_palettized, x = var_1090_cast_fp16)[name = string("linear_105_cast_fp16")]; tensor input_211_cast_fp16 = add(x = input_207_cast_fp16, y = linear_105_cast_fp16)[name = string("input_211_cast_fp16")]; tensor input_213_axes_0 = const()[name = string("input_213_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_17_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_17_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(305840320)))]; tensor encoder_text_model_encoder_layers_17_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_17_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(305842944)))]; tensor input_213_cast_fp16 = layer_norm(axes = input_213_axes_0, beta = encoder_text_model_encoder_layers_17_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_17_layer_norm2_weight_to_fp16, x = input_211_cast_fp16)[name = string("input_213_cast_fp16")]; tensor encoder_text_model_encoder_layers_17_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(305845568))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(310760832))))[name = string("encoder_text_model_encoder_layers_17_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_17_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_17_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(310801856)))]; tensor linear_106_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_17_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_17_mlp_fc1_weight_to_fp16_palettized, x = input_213_cast_fp16)[name = string("linear_106_cast_fp16")]; string input_217_mode_0 = const()[name = string("input_217_mode_0"), val = string("EXACT")]; tensor input_217_cast_fp16 = gelu(mode = input_217_mode_0, x = linear_106_cast_fp16)[name = string("input_217_cast_fp16")]; tensor encoder_text_model_encoder_layers_17_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(310812160))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(315727424))))[name = string("encoder_text_model_encoder_layers_17_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_17_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_17_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(315737728)))]; tensor linear_107_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_17_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_17_mlp_fc2_weight_to_fp16_palettized, x = input_217_cast_fp16)[name = string("linear_107_cast_fp16")]; tensor input_219_cast_fp16 = add(x = input_211_cast_fp16, y = linear_107_cast_fp16)[name = string("input_219_cast_fp16")]; tensor hidden_states_109_axes_0 = const()[name = string("hidden_states_109_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_18_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_18_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(315740352)))]; tensor encoder_text_model_encoder_layers_18_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_18_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(315742976)))]; tensor hidden_states_109_cast_fp16 = layer_norm(axes = hidden_states_109_axes_0, beta = encoder_text_model_encoder_layers_18_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_18_layer_norm1_weight_to_fp16, x = input_219_cast_fp16)[name = string("hidden_states_109_cast_fp16")]; tensor encoder_text_model_encoder_layers_18_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(315745600))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(316974464))))[name = string("encoder_text_model_encoder_layers_18_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_18_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_18_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(316984768)))]; tensor linear_108_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_18_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_18_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_109_cast_fp16)[name = string("linear_108_cast_fp16")]; tensor encoder_text_model_encoder_layers_18_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(316987392))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(318216256))))[name = string("encoder_text_model_encoder_layers_18_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_18_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_18_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(318226560)))]; tensor linear_109_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_18_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_18_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_109_cast_fp16)[name = string("linear_109_cast_fp16")]; tensor encoder_text_model_encoder_layers_18_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(318229184))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(319458048))))[name = string("encoder_text_model_encoder_layers_18_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_18_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_18_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(319468352)))]; tensor linear_110_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_18_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_18_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_109_cast_fp16)[name = string("linear_110_cast_fp16")]; tensor var_1133 = const()[name = string("op_1133"), val = tensor([1, 77, -1, 64])]; tensor var_1134_cast_fp16 = reshape(shape = var_1133, x = linear_108_cast_fp16)[name = string("op_1134_cast_fp16")]; tensor var_1136 = const()[name = string("op_1136"), val = tensor([1, 77, -1, 64])]; tensor var_1137_cast_fp16 = reshape(shape = var_1136, x = linear_109_cast_fp16)[name = string("op_1137_cast_fp16")]; tensor var_1139 = const()[name = string("op_1139"), val = tensor([1, 77, -1, 64])]; tensor var_1140_cast_fp16 = reshape(shape = var_1139, x = linear_110_cast_fp16)[name = string("op_1140_cast_fp16")]; tensor value_37_perm_0 = const()[name = string("value_37_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_37_cast_fp16 = mul(x = var_1134_cast_fp16, y = var_11_to_fp16)[name = string("mul_37_cast_fp16")]; bool matmul_18_transpose_y_0 = const()[name = string("matmul_18_transpose_y_0"), val = bool(true)]; bool matmul_18_transpose_x_0 = const()[name = string("matmul_18_transpose_x_0"), val = bool(false)]; tensor transpose_164_perm_0 = const()[name = string("transpose_164_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_165_perm_0 = const()[name = string("transpose_165_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_165 = transpose(perm = transpose_165_perm_0, x = var_1137_cast_fp16)[name = string("transpose_246")]; tensor transpose_164 = transpose(perm = transpose_164_perm_0, x = mul_37_cast_fp16)[name = string("transpose_247")]; tensor matmul_18_cast_fp16 = matmul(transpose_x = matmul_18_transpose_x_0, transpose_y = matmul_18_transpose_y_0, x = transpose_164, y = transpose_165)[name = string("matmul_18_cast_fp16")]; tensor add_18_cast_fp16 = add(x = matmul_18_cast_fp16, y = mul_0_to_fp16)[name = string("add_18_cast_fp16")]; int32 softmax_18_axis_0 = const()[name = string("softmax_18_axis_0"), val = int32(-1)]; tensor softmax_18_cast_fp16 = softmax(axis = softmax_18_axis_0, x = add_18_cast_fp16)[name = string("softmax_18_cast_fp16")]; bool attn_output_73_transpose_x_0 = const()[name = string("attn_output_73_transpose_x_0"), val = bool(false)]; bool attn_output_73_transpose_y_0 = const()[name = string("attn_output_73_transpose_y_0"), val = bool(false)]; tensor value_37_cast_fp16 = transpose(perm = value_37_perm_0, x = var_1140_cast_fp16)[name = string("transpose_245")]; tensor attn_output_73_cast_fp16 = matmul(transpose_x = attn_output_73_transpose_x_0, transpose_y = attn_output_73_transpose_y_0, x = softmax_18_cast_fp16, y = value_37_cast_fp16)[name = string("attn_output_73_cast_fp16")]; tensor var_1143_perm_0 = const()[name = string("op_1143_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1145 = const()[name = string("op_1145"), val = tensor([1, 77, -1])]; tensor var_1143_cast_fp16 = transpose(perm = var_1143_perm_0, x = attn_output_73_cast_fp16)[name = string("transpose_244")]; tensor var_1146_cast_fp16 = reshape(shape = var_1145, x = var_1143_cast_fp16)[name = string("op_1146_cast_fp16")]; tensor encoder_text_model_encoder_layers_18_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(319470976))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(320699840))))[name = string("encoder_text_model_encoder_layers_18_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_18_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_18_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(320710144)))]; tensor linear_111_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_18_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_18_self_attn_out_proj_weight_to_fp16_palettized, x = var_1146_cast_fp16)[name = string("linear_111_cast_fp16")]; tensor input_223_cast_fp16 = add(x = input_219_cast_fp16, y = linear_111_cast_fp16)[name = string("input_223_cast_fp16")]; tensor input_225_axes_0 = const()[name = string("input_225_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_18_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_18_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(320712768)))]; tensor encoder_text_model_encoder_layers_18_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_18_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(320715392)))]; tensor input_225_cast_fp16 = layer_norm(axes = input_225_axes_0, beta = encoder_text_model_encoder_layers_18_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_18_layer_norm2_weight_to_fp16, x = input_223_cast_fp16)[name = string("input_225_cast_fp16")]; tensor encoder_text_model_encoder_layers_18_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(320718016))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(325633280))))[name = string("encoder_text_model_encoder_layers_18_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_18_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_18_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(325674304)))]; tensor linear_112_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_18_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_18_mlp_fc1_weight_to_fp16_palettized, x = input_225_cast_fp16)[name = string("linear_112_cast_fp16")]; string input_229_mode_0 = const()[name = string("input_229_mode_0"), val = string("EXACT")]; tensor input_229_cast_fp16 = gelu(mode = input_229_mode_0, x = linear_112_cast_fp16)[name = string("input_229_cast_fp16")]; tensor encoder_text_model_encoder_layers_18_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(325684608))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(330599872))))[name = string("encoder_text_model_encoder_layers_18_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_18_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_18_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(330610176)))]; tensor linear_113_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_18_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_18_mlp_fc2_weight_to_fp16_palettized, x = input_229_cast_fp16)[name = string("linear_113_cast_fp16")]; tensor input_231_cast_fp16 = add(x = input_223_cast_fp16, y = linear_113_cast_fp16)[name = string("input_231_cast_fp16")]; tensor hidden_states_115_axes_0 = const()[name = string("hidden_states_115_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_19_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_19_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(330612800)))]; tensor encoder_text_model_encoder_layers_19_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_19_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(330615424)))]; tensor hidden_states_115_cast_fp16 = layer_norm(axes = hidden_states_115_axes_0, beta = encoder_text_model_encoder_layers_19_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_19_layer_norm1_weight_to_fp16, x = input_231_cast_fp16)[name = string("hidden_states_115_cast_fp16")]; tensor encoder_text_model_encoder_layers_19_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(330618048))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(331846912))))[name = string("encoder_text_model_encoder_layers_19_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_19_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_19_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(331857216)))]; tensor linear_114_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_19_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_19_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_115_cast_fp16)[name = string("linear_114_cast_fp16")]; tensor encoder_text_model_encoder_layers_19_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(331859840))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(333088704))))[name = string("encoder_text_model_encoder_layers_19_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_19_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_19_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(333099008)))]; tensor linear_115_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_19_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_19_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_115_cast_fp16)[name = string("linear_115_cast_fp16")]; tensor encoder_text_model_encoder_layers_19_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(333101632))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(334330496))))[name = string("encoder_text_model_encoder_layers_19_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_19_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_19_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(334340800)))]; tensor linear_116_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_19_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_19_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_115_cast_fp16)[name = string("linear_116_cast_fp16")]; tensor var_1189 = const()[name = string("op_1189"), val = tensor([1, 77, -1, 64])]; tensor var_1190_cast_fp16 = reshape(shape = var_1189, x = linear_114_cast_fp16)[name = string("op_1190_cast_fp16")]; tensor var_1192 = const()[name = string("op_1192"), val = tensor([1, 77, -1, 64])]; tensor var_1193_cast_fp16 = reshape(shape = var_1192, x = linear_115_cast_fp16)[name = string("op_1193_cast_fp16")]; tensor var_1195 = const()[name = string("op_1195"), val = tensor([1, 77, -1, 64])]; tensor var_1196_cast_fp16 = reshape(shape = var_1195, x = linear_116_cast_fp16)[name = string("op_1196_cast_fp16")]; tensor value_39_perm_0 = const()[name = string("value_39_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_39_cast_fp16 = mul(x = var_1190_cast_fp16, y = var_11_to_fp16)[name = string("mul_39_cast_fp16")]; bool matmul_19_transpose_y_0 = const()[name = string("matmul_19_transpose_y_0"), val = bool(true)]; bool matmul_19_transpose_x_0 = const()[name = string("matmul_19_transpose_x_0"), val = bool(false)]; tensor transpose_166_perm_0 = const()[name = string("transpose_166_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_167_perm_0 = const()[name = string("transpose_167_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_167 = transpose(perm = transpose_167_perm_0, x = var_1193_cast_fp16)[name = string("transpose_242")]; tensor transpose_166 = transpose(perm = transpose_166_perm_0, x = mul_39_cast_fp16)[name = string("transpose_243")]; tensor matmul_19_cast_fp16 = matmul(transpose_x = matmul_19_transpose_x_0, transpose_y = matmul_19_transpose_y_0, x = transpose_166, y = transpose_167)[name = string("matmul_19_cast_fp16")]; tensor add_19_cast_fp16 = add(x = matmul_19_cast_fp16, y = mul_0_to_fp16)[name = string("add_19_cast_fp16")]; int32 softmax_19_axis_0 = const()[name = string("softmax_19_axis_0"), val = int32(-1)]; tensor softmax_19_cast_fp16 = softmax(axis = softmax_19_axis_0, x = add_19_cast_fp16)[name = string("softmax_19_cast_fp16")]; bool attn_output_77_transpose_x_0 = const()[name = string("attn_output_77_transpose_x_0"), val = bool(false)]; bool attn_output_77_transpose_y_0 = const()[name = string("attn_output_77_transpose_y_0"), val = bool(false)]; tensor value_39_cast_fp16 = transpose(perm = value_39_perm_0, x = var_1196_cast_fp16)[name = string("transpose_241")]; tensor attn_output_77_cast_fp16 = matmul(transpose_x = attn_output_77_transpose_x_0, transpose_y = attn_output_77_transpose_y_0, x = softmax_19_cast_fp16, y = value_39_cast_fp16)[name = string("attn_output_77_cast_fp16")]; tensor var_1199_perm_0 = const()[name = string("op_1199_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1201 = const()[name = string("op_1201"), val = tensor([1, 77, -1])]; tensor var_1199_cast_fp16 = transpose(perm = var_1199_perm_0, x = attn_output_77_cast_fp16)[name = string("transpose_240")]; tensor var_1202_cast_fp16 = reshape(shape = var_1201, x = var_1199_cast_fp16)[name = string("op_1202_cast_fp16")]; tensor encoder_text_model_encoder_layers_19_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(334343424))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(335572288))))[name = string("encoder_text_model_encoder_layers_19_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_19_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_19_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(335582592)))]; tensor linear_117_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_19_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_19_self_attn_out_proj_weight_to_fp16_palettized, x = var_1202_cast_fp16)[name = string("linear_117_cast_fp16")]; tensor input_235_cast_fp16 = add(x = input_231_cast_fp16, y = linear_117_cast_fp16)[name = string("input_235_cast_fp16")]; tensor input_237_axes_0 = const()[name = string("input_237_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_19_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_19_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(335585216)))]; tensor encoder_text_model_encoder_layers_19_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_19_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(335587840)))]; tensor input_237_cast_fp16 = layer_norm(axes = input_237_axes_0, beta = encoder_text_model_encoder_layers_19_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_19_layer_norm2_weight_to_fp16, x = input_235_cast_fp16)[name = string("input_237_cast_fp16")]; tensor encoder_text_model_encoder_layers_19_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(335590464))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(340505728))))[name = string("encoder_text_model_encoder_layers_19_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_19_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_19_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(340546752)))]; tensor linear_118_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_19_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_19_mlp_fc1_weight_to_fp16_palettized, x = input_237_cast_fp16)[name = string("linear_118_cast_fp16")]; string input_241_mode_0 = const()[name = string("input_241_mode_0"), val = string("EXACT")]; tensor input_241_cast_fp16 = gelu(mode = input_241_mode_0, x = linear_118_cast_fp16)[name = string("input_241_cast_fp16")]; tensor encoder_text_model_encoder_layers_19_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(340557056))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(345472320))))[name = string("encoder_text_model_encoder_layers_19_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_19_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_19_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(345482624)))]; tensor linear_119_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_19_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_19_mlp_fc2_weight_to_fp16_palettized, x = input_241_cast_fp16)[name = string("linear_119_cast_fp16")]; tensor input_243_cast_fp16 = add(x = input_235_cast_fp16, y = linear_119_cast_fp16)[name = string("input_243_cast_fp16")]; tensor hidden_states_121_axes_0 = const()[name = string("hidden_states_121_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_20_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_20_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(345485248)))]; tensor encoder_text_model_encoder_layers_20_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_20_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(345487872)))]; tensor hidden_states_121_cast_fp16 = layer_norm(axes = hidden_states_121_axes_0, beta = encoder_text_model_encoder_layers_20_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_20_layer_norm1_weight_to_fp16, x = input_243_cast_fp16)[name = string("hidden_states_121_cast_fp16")]; tensor encoder_text_model_encoder_layers_20_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(345490496))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(346719360))))[name = string("encoder_text_model_encoder_layers_20_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_20_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_20_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(346729664)))]; tensor linear_120_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_20_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_20_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_121_cast_fp16)[name = string("linear_120_cast_fp16")]; tensor encoder_text_model_encoder_layers_20_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(346732288))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(347961152))))[name = string("encoder_text_model_encoder_layers_20_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_20_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_20_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(347971456)))]; tensor linear_121_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_20_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_20_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_121_cast_fp16)[name = string("linear_121_cast_fp16")]; tensor encoder_text_model_encoder_layers_20_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(347974080))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(349202944))))[name = string("encoder_text_model_encoder_layers_20_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_20_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_20_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(349213248)))]; tensor linear_122_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_20_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_20_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_121_cast_fp16)[name = string("linear_122_cast_fp16")]; tensor var_1245 = const()[name = string("op_1245"), val = tensor([1, 77, -1, 64])]; tensor var_1246_cast_fp16 = reshape(shape = var_1245, x = linear_120_cast_fp16)[name = string("op_1246_cast_fp16")]; tensor var_1248 = const()[name = string("op_1248"), val = tensor([1, 77, -1, 64])]; tensor var_1249_cast_fp16 = reshape(shape = var_1248, x = linear_121_cast_fp16)[name = string("op_1249_cast_fp16")]; tensor var_1251 = const()[name = string("op_1251"), val = tensor([1, 77, -1, 64])]; tensor var_1252_cast_fp16 = reshape(shape = var_1251, x = linear_122_cast_fp16)[name = string("op_1252_cast_fp16")]; tensor value_41_perm_0 = const()[name = string("value_41_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_41_cast_fp16 = mul(x = var_1246_cast_fp16, y = var_11_to_fp16)[name = string("mul_41_cast_fp16")]; bool matmul_20_transpose_y_0 = const()[name = string("matmul_20_transpose_y_0"), val = bool(true)]; bool matmul_20_transpose_x_0 = const()[name = string("matmul_20_transpose_x_0"), val = bool(false)]; tensor transpose_168_perm_0 = const()[name = string("transpose_168_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_169_perm_0 = const()[name = string("transpose_169_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_169 = transpose(perm = transpose_169_perm_0, x = var_1249_cast_fp16)[name = string("transpose_238")]; tensor transpose_168 = transpose(perm = transpose_168_perm_0, x = mul_41_cast_fp16)[name = string("transpose_239")]; tensor matmul_20_cast_fp16 = matmul(transpose_x = matmul_20_transpose_x_0, transpose_y = matmul_20_transpose_y_0, x = transpose_168, y = transpose_169)[name = string("matmul_20_cast_fp16")]; tensor add_20_cast_fp16 = add(x = matmul_20_cast_fp16, y = mul_0_to_fp16)[name = string("add_20_cast_fp16")]; int32 softmax_20_axis_0 = const()[name = string("softmax_20_axis_0"), val = int32(-1)]; tensor softmax_20_cast_fp16 = softmax(axis = softmax_20_axis_0, x = add_20_cast_fp16)[name = string("softmax_20_cast_fp16")]; bool attn_output_81_transpose_x_0 = const()[name = string("attn_output_81_transpose_x_0"), val = bool(false)]; bool attn_output_81_transpose_y_0 = const()[name = string("attn_output_81_transpose_y_0"), val = bool(false)]; tensor value_41_cast_fp16 = transpose(perm = value_41_perm_0, x = var_1252_cast_fp16)[name = string("transpose_237")]; tensor attn_output_81_cast_fp16 = matmul(transpose_x = attn_output_81_transpose_x_0, transpose_y = attn_output_81_transpose_y_0, x = softmax_20_cast_fp16, y = value_41_cast_fp16)[name = string("attn_output_81_cast_fp16")]; tensor var_1255_perm_0 = const()[name = string("op_1255_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1257 = const()[name = string("op_1257"), val = tensor([1, 77, -1])]; tensor var_1255_cast_fp16 = transpose(perm = var_1255_perm_0, x = attn_output_81_cast_fp16)[name = string("transpose_236")]; tensor var_1258_cast_fp16 = reshape(shape = var_1257, x = var_1255_cast_fp16)[name = string("op_1258_cast_fp16")]; tensor encoder_text_model_encoder_layers_20_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(349215872))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(350444736))))[name = string("encoder_text_model_encoder_layers_20_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_20_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_20_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(350455040)))]; tensor linear_123_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_20_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_20_self_attn_out_proj_weight_to_fp16_palettized, x = var_1258_cast_fp16)[name = string("linear_123_cast_fp16")]; tensor input_247_cast_fp16 = add(x = input_243_cast_fp16, y = linear_123_cast_fp16)[name = string("input_247_cast_fp16")]; tensor input_249_axes_0 = const()[name = string("input_249_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_20_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_20_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(350457664)))]; tensor encoder_text_model_encoder_layers_20_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_20_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(350460288)))]; tensor input_249_cast_fp16 = layer_norm(axes = input_249_axes_0, beta = encoder_text_model_encoder_layers_20_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_20_layer_norm2_weight_to_fp16, x = input_247_cast_fp16)[name = string("input_249_cast_fp16")]; tensor encoder_text_model_encoder_layers_20_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(350462912))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(355378176))))[name = string("encoder_text_model_encoder_layers_20_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_20_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_20_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(355419200)))]; tensor linear_124_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_20_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_20_mlp_fc1_weight_to_fp16_palettized, x = input_249_cast_fp16)[name = string("linear_124_cast_fp16")]; string input_253_mode_0 = const()[name = string("input_253_mode_0"), val = string("EXACT")]; tensor input_253_cast_fp16 = gelu(mode = input_253_mode_0, x = linear_124_cast_fp16)[name = string("input_253_cast_fp16")]; tensor encoder_text_model_encoder_layers_20_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(355429504))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(360344768))))[name = string("encoder_text_model_encoder_layers_20_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_20_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_20_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(360355072)))]; tensor linear_125_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_20_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_20_mlp_fc2_weight_to_fp16_palettized, x = input_253_cast_fp16)[name = string("linear_125_cast_fp16")]; tensor input_255_cast_fp16 = add(x = input_247_cast_fp16, y = linear_125_cast_fp16)[name = string("input_255_cast_fp16")]; tensor hidden_states_127_axes_0 = const()[name = string("hidden_states_127_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_21_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_21_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(360357696)))]; tensor encoder_text_model_encoder_layers_21_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_21_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(360360320)))]; tensor hidden_states_127_cast_fp16 = layer_norm(axes = hidden_states_127_axes_0, beta = encoder_text_model_encoder_layers_21_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_21_layer_norm1_weight_to_fp16, x = input_255_cast_fp16)[name = string("hidden_states_127_cast_fp16")]; tensor encoder_text_model_encoder_layers_21_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(360362944))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(361591808))))[name = string("encoder_text_model_encoder_layers_21_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_21_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_21_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(361602112)))]; tensor linear_126_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_21_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_21_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_127_cast_fp16)[name = string("linear_126_cast_fp16")]; tensor encoder_text_model_encoder_layers_21_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(361604736))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(362833600))))[name = string("encoder_text_model_encoder_layers_21_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_21_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_21_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(362843904)))]; tensor linear_127_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_21_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_21_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_127_cast_fp16)[name = string("linear_127_cast_fp16")]; tensor encoder_text_model_encoder_layers_21_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(362846528))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(364075392))))[name = string("encoder_text_model_encoder_layers_21_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_21_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_21_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(364085696)))]; tensor linear_128_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_21_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_21_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_127_cast_fp16)[name = string("linear_128_cast_fp16")]; tensor var_1301 = const()[name = string("op_1301"), val = tensor([1, 77, -1, 64])]; tensor var_1302_cast_fp16 = reshape(shape = var_1301, x = linear_126_cast_fp16)[name = string("op_1302_cast_fp16")]; tensor var_1304 = const()[name = string("op_1304"), val = tensor([1, 77, -1, 64])]; tensor var_1305_cast_fp16 = reshape(shape = var_1304, x = linear_127_cast_fp16)[name = string("op_1305_cast_fp16")]; tensor var_1307 = const()[name = string("op_1307"), val = tensor([1, 77, -1, 64])]; tensor var_1308_cast_fp16 = reshape(shape = var_1307, x = linear_128_cast_fp16)[name = string("op_1308_cast_fp16")]; tensor value_43_perm_0 = const()[name = string("value_43_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_43_cast_fp16 = mul(x = var_1302_cast_fp16, y = var_11_to_fp16)[name = string("mul_43_cast_fp16")]; bool matmul_21_transpose_y_0 = const()[name = string("matmul_21_transpose_y_0"), val = bool(true)]; bool matmul_21_transpose_x_0 = const()[name = string("matmul_21_transpose_x_0"), val = bool(false)]; tensor transpose_170_perm_0 = const()[name = string("transpose_170_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_171_perm_0 = const()[name = string("transpose_171_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_171 = transpose(perm = transpose_171_perm_0, x = var_1305_cast_fp16)[name = string("transpose_234")]; tensor transpose_170 = transpose(perm = transpose_170_perm_0, x = mul_43_cast_fp16)[name = string("transpose_235")]; tensor matmul_21_cast_fp16 = matmul(transpose_x = matmul_21_transpose_x_0, transpose_y = matmul_21_transpose_y_0, x = transpose_170, y = transpose_171)[name = string("matmul_21_cast_fp16")]; tensor add_21_cast_fp16 = add(x = matmul_21_cast_fp16, y = mul_0_to_fp16)[name = string("add_21_cast_fp16")]; int32 softmax_21_axis_0 = const()[name = string("softmax_21_axis_0"), val = int32(-1)]; tensor softmax_21_cast_fp16 = softmax(axis = softmax_21_axis_0, x = add_21_cast_fp16)[name = string("softmax_21_cast_fp16")]; bool attn_output_85_transpose_x_0 = const()[name = string("attn_output_85_transpose_x_0"), val = bool(false)]; bool attn_output_85_transpose_y_0 = const()[name = string("attn_output_85_transpose_y_0"), val = bool(false)]; tensor value_43_cast_fp16 = transpose(perm = value_43_perm_0, x = var_1308_cast_fp16)[name = string("transpose_233")]; tensor attn_output_85_cast_fp16 = matmul(transpose_x = attn_output_85_transpose_x_0, transpose_y = attn_output_85_transpose_y_0, x = softmax_21_cast_fp16, y = value_43_cast_fp16)[name = string("attn_output_85_cast_fp16")]; tensor var_1311_perm_0 = const()[name = string("op_1311_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1313 = const()[name = string("op_1313"), val = tensor([1, 77, -1])]; tensor var_1311_cast_fp16 = transpose(perm = var_1311_perm_0, x = attn_output_85_cast_fp16)[name = string("transpose_232")]; tensor var_1314_cast_fp16 = reshape(shape = var_1313, x = var_1311_cast_fp16)[name = string("op_1314_cast_fp16")]; tensor encoder_text_model_encoder_layers_21_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(364088320))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(365317184))))[name = string("encoder_text_model_encoder_layers_21_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_21_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_21_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(365327488)))]; tensor linear_129_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_21_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_21_self_attn_out_proj_weight_to_fp16_palettized, x = var_1314_cast_fp16)[name = string("linear_129_cast_fp16")]; tensor input_259_cast_fp16 = add(x = input_255_cast_fp16, y = linear_129_cast_fp16)[name = string("input_259_cast_fp16")]; tensor input_261_axes_0 = const()[name = string("input_261_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_21_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_21_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(365330112)))]; tensor encoder_text_model_encoder_layers_21_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_21_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(365332736)))]; tensor input_261_cast_fp16 = layer_norm(axes = input_261_axes_0, beta = encoder_text_model_encoder_layers_21_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_21_layer_norm2_weight_to_fp16, x = input_259_cast_fp16)[name = string("input_261_cast_fp16")]; tensor encoder_text_model_encoder_layers_21_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(365335360))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(370250624))))[name = string("encoder_text_model_encoder_layers_21_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_21_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_21_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(370291648)))]; tensor linear_130_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_21_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_21_mlp_fc1_weight_to_fp16_palettized, x = input_261_cast_fp16)[name = string("linear_130_cast_fp16")]; string input_265_mode_0 = const()[name = string("input_265_mode_0"), val = string("EXACT")]; tensor input_265_cast_fp16 = gelu(mode = input_265_mode_0, x = linear_130_cast_fp16)[name = string("input_265_cast_fp16")]; tensor encoder_text_model_encoder_layers_21_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(370301952))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(375217216))))[name = string("encoder_text_model_encoder_layers_21_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_21_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_21_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(375227520)))]; tensor linear_131_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_21_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_21_mlp_fc2_weight_to_fp16_palettized, x = input_265_cast_fp16)[name = string("linear_131_cast_fp16")]; tensor input_267_cast_fp16 = add(x = input_259_cast_fp16, y = linear_131_cast_fp16)[name = string("input_267_cast_fp16")]; tensor hidden_states_133_axes_0 = const()[name = string("hidden_states_133_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_22_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_22_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(375230144)))]; tensor encoder_text_model_encoder_layers_22_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_22_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(375232768)))]; tensor hidden_states_133_cast_fp16 = layer_norm(axes = hidden_states_133_axes_0, beta = encoder_text_model_encoder_layers_22_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_22_layer_norm1_weight_to_fp16, x = input_267_cast_fp16)[name = string("hidden_states_133_cast_fp16")]; tensor encoder_text_model_encoder_layers_22_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(375235392))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(376464256))))[name = string("encoder_text_model_encoder_layers_22_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_22_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_22_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(376474560)))]; tensor linear_132_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_22_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_22_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_133_cast_fp16)[name = string("linear_132_cast_fp16")]; tensor encoder_text_model_encoder_layers_22_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(376477184))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(377706048))))[name = string("encoder_text_model_encoder_layers_22_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_22_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_22_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(377716352)))]; tensor linear_133_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_22_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_22_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_133_cast_fp16)[name = string("linear_133_cast_fp16")]; tensor encoder_text_model_encoder_layers_22_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(377718976))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(378947840))))[name = string("encoder_text_model_encoder_layers_22_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_22_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_22_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(378958144)))]; tensor linear_134_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_22_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_22_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_133_cast_fp16)[name = string("linear_134_cast_fp16")]; tensor var_1357 = const()[name = string("op_1357"), val = tensor([1, 77, -1, 64])]; tensor var_1358_cast_fp16 = reshape(shape = var_1357, x = linear_132_cast_fp16)[name = string("op_1358_cast_fp16")]; tensor var_1360 = const()[name = string("op_1360"), val = tensor([1, 77, -1, 64])]; tensor var_1361_cast_fp16 = reshape(shape = var_1360, x = linear_133_cast_fp16)[name = string("op_1361_cast_fp16")]; tensor var_1363 = const()[name = string("op_1363"), val = tensor([1, 77, -1, 64])]; tensor var_1364_cast_fp16 = reshape(shape = var_1363, x = linear_134_cast_fp16)[name = string("op_1364_cast_fp16")]; tensor value_45_perm_0 = const()[name = string("value_45_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_45_cast_fp16 = mul(x = var_1358_cast_fp16, y = var_11_to_fp16)[name = string("mul_45_cast_fp16")]; bool matmul_22_transpose_y_0 = const()[name = string("matmul_22_transpose_y_0"), val = bool(true)]; bool matmul_22_transpose_x_0 = const()[name = string("matmul_22_transpose_x_0"), val = bool(false)]; tensor transpose_172_perm_0 = const()[name = string("transpose_172_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_173_perm_0 = const()[name = string("transpose_173_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_173 = transpose(perm = transpose_173_perm_0, x = var_1361_cast_fp16)[name = string("transpose_230")]; tensor transpose_172 = transpose(perm = transpose_172_perm_0, x = mul_45_cast_fp16)[name = string("transpose_231")]; tensor matmul_22_cast_fp16 = matmul(transpose_x = matmul_22_transpose_x_0, transpose_y = matmul_22_transpose_y_0, x = transpose_172, y = transpose_173)[name = string("matmul_22_cast_fp16")]; tensor add_22_cast_fp16 = add(x = matmul_22_cast_fp16, y = mul_0_to_fp16)[name = string("add_22_cast_fp16")]; int32 softmax_22_axis_0 = const()[name = string("softmax_22_axis_0"), val = int32(-1)]; tensor softmax_22_cast_fp16 = softmax(axis = softmax_22_axis_0, x = add_22_cast_fp16)[name = string("softmax_22_cast_fp16")]; bool attn_output_89_transpose_x_0 = const()[name = string("attn_output_89_transpose_x_0"), val = bool(false)]; bool attn_output_89_transpose_y_0 = const()[name = string("attn_output_89_transpose_y_0"), val = bool(false)]; tensor value_45_cast_fp16 = transpose(perm = value_45_perm_0, x = var_1364_cast_fp16)[name = string("transpose_229")]; tensor attn_output_89_cast_fp16 = matmul(transpose_x = attn_output_89_transpose_x_0, transpose_y = attn_output_89_transpose_y_0, x = softmax_22_cast_fp16, y = value_45_cast_fp16)[name = string("attn_output_89_cast_fp16")]; tensor var_1367_perm_0 = const()[name = string("op_1367_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1369 = const()[name = string("op_1369"), val = tensor([1, 77, -1])]; tensor var_1367_cast_fp16 = transpose(perm = var_1367_perm_0, x = attn_output_89_cast_fp16)[name = string("transpose_228")]; tensor var_1370_cast_fp16 = reshape(shape = var_1369, x = var_1367_cast_fp16)[name = string("op_1370_cast_fp16")]; tensor encoder_text_model_encoder_layers_22_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(378960768))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(380189632))))[name = string("encoder_text_model_encoder_layers_22_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_22_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_22_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(380199936)))]; tensor linear_135_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_22_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_22_self_attn_out_proj_weight_to_fp16_palettized, x = var_1370_cast_fp16)[name = string("linear_135_cast_fp16")]; tensor input_271_cast_fp16 = add(x = input_267_cast_fp16, y = linear_135_cast_fp16)[name = string("input_271_cast_fp16")]; tensor input_273_axes_0 = const()[name = string("input_273_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_22_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_22_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(380202560)))]; tensor encoder_text_model_encoder_layers_22_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_22_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(380205184)))]; tensor input_273_cast_fp16 = layer_norm(axes = input_273_axes_0, beta = encoder_text_model_encoder_layers_22_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_22_layer_norm2_weight_to_fp16, x = input_271_cast_fp16)[name = string("input_273_cast_fp16")]; tensor encoder_text_model_encoder_layers_22_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(380207808))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(385123072))))[name = string("encoder_text_model_encoder_layers_22_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_22_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_22_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(385164096)))]; tensor linear_136_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_22_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_22_mlp_fc1_weight_to_fp16_palettized, x = input_273_cast_fp16)[name = string("linear_136_cast_fp16")]; string input_277_mode_0 = const()[name = string("input_277_mode_0"), val = string("EXACT")]; tensor input_277_cast_fp16 = gelu(mode = input_277_mode_0, x = linear_136_cast_fp16)[name = string("input_277_cast_fp16")]; tensor encoder_text_model_encoder_layers_22_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(385174400))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(390089664))))[name = string("encoder_text_model_encoder_layers_22_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_22_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_22_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(390099968)))]; tensor linear_137_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_22_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_22_mlp_fc2_weight_to_fp16_palettized, x = input_277_cast_fp16)[name = string("linear_137_cast_fp16")]; tensor input_279_cast_fp16 = add(x = input_271_cast_fp16, y = linear_137_cast_fp16)[name = string("input_279_cast_fp16")]; tensor hidden_states_139_axes_0 = const()[name = string("hidden_states_139_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_23_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_23_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(390102592)))]; tensor encoder_text_model_encoder_layers_23_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_23_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(390105216)))]; tensor hidden_states_139_cast_fp16 = layer_norm(axes = hidden_states_139_axes_0, beta = encoder_text_model_encoder_layers_23_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_23_layer_norm1_weight_to_fp16, x = input_279_cast_fp16)[name = string("hidden_states_139_cast_fp16")]; tensor encoder_text_model_encoder_layers_23_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(390107840))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(391336704))))[name = string("encoder_text_model_encoder_layers_23_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_23_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_23_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(391347008)))]; tensor linear_138_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_23_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_23_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_139_cast_fp16)[name = string("linear_138_cast_fp16")]; tensor encoder_text_model_encoder_layers_23_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(391349632))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(392578496))))[name = string("encoder_text_model_encoder_layers_23_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_23_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_23_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(392588800)))]; tensor linear_139_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_23_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_23_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_139_cast_fp16)[name = string("linear_139_cast_fp16")]; tensor encoder_text_model_encoder_layers_23_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(392591424))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(393820288))))[name = string("encoder_text_model_encoder_layers_23_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_23_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_23_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(393830592)))]; tensor linear_140_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_23_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_23_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_139_cast_fp16)[name = string("linear_140_cast_fp16")]; tensor var_1413 = const()[name = string("op_1413"), val = tensor([1, 77, -1, 64])]; tensor var_1414_cast_fp16 = reshape(shape = var_1413, x = linear_138_cast_fp16)[name = string("op_1414_cast_fp16")]; tensor var_1416 = const()[name = string("op_1416"), val = tensor([1, 77, -1, 64])]; tensor var_1417_cast_fp16 = reshape(shape = var_1416, x = linear_139_cast_fp16)[name = string("op_1417_cast_fp16")]; tensor var_1419 = const()[name = string("op_1419"), val = tensor([1, 77, -1, 64])]; tensor var_1420_cast_fp16 = reshape(shape = var_1419, x = linear_140_cast_fp16)[name = string("op_1420_cast_fp16")]; tensor value_47_perm_0 = const()[name = string("value_47_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_47_cast_fp16 = mul(x = var_1414_cast_fp16, y = var_11_to_fp16)[name = string("mul_47_cast_fp16")]; bool matmul_23_transpose_y_0 = const()[name = string("matmul_23_transpose_y_0"), val = bool(true)]; bool matmul_23_transpose_x_0 = const()[name = string("matmul_23_transpose_x_0"), val = bool(false)]; tensor transpose_174_perm_0 = const()[name = string("transpose_174_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_175_perm_0 = const()[name = string("transpose_175_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_175 = transpose(perm = transpose_175_perm_0, x = var_1417_cast_fp16)[name = string("transpose_226")]; tensor transpose_174 = transpose(perm = transpose_174_perm_0, x = mul_47_cast_fp16)[name = string("transpose_227")]; tensor matmul_23_cast_fp16 = matmul(transpose_x = matmul_23_transpose_x_0, transpose_y = matmul_23_transpose_y_0, x = transpose_174, y = transpose_175)[name = string("matmul_23_cast_fp16")]; tensor add_23_cast_fp16 = add(x = matmul_23_cast_fp16, y = mul_0_to_fp16)[name = string("add_23_cast_fp16")]; int32 softmax_23_axis_0 = const()[name = string("softmax_23_axis_0"), val = int32(-1)]; tensor softmax_23_cast_fp16 = softmax(axis = softmax_23_axis_0, x = add_23_cast_fp16)[name = string("softmax_23_cast_fp16")]; bool attn_output_93_transpose_x_0 = const()[name = string("attn_output_93_transpose_x_0"), val = bool(false)]; bool attn_output_93_transpose_y_0 = const()[name = string("attn_output_93_transpose_y_0"), val = bool(false)]; tensor value_47_cast_fp16 = transpose(perm = value_47_perm_0, x = var_1420_cast_fp16)[name = string("transpose_225")]; tensor attn_output_93_cast_fp16 = matmul(transpose_x = attn_output_93_transpose_x_0, transpose_y = attn_output_93_transpose_y_0, x = softmax_23_cast_fp16, y = value_47_cast_fp16)[name = string("attn_output_93_cast_fp16")]; tensor var_1423_perm_0 = const()[name = string("op_1423_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1425 = const()[name = string("op_1425"), val = tensor([1, 77, -1])]; tensor var_1423_cast_fp16 = transpose(perm = var_1423_perm_0, x = attn_output_93_cast_fp16)[name = string("transpose_224")]; tensor var_1426_cast_fp16 = reshape(shape = var_1425, x = var_1423_cast_fp16)[name = string("op_1426_cast_fp16")]; tensor encoder_text_model_encoder_layers_23_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(393833216))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(395062080))))[name = string("encoder_text_model_encoder_layers_23_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_23_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_23_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(395072384)))]; tensor linear_141_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_23_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_23_self_attn_out_proj_weight_to_fp16_palettized, x = var_1426_cast_fp16)[name = string("linear_141_cast_fp16")]; tensor input_283_cast_fp16 = add(x = input_279_cast_fp16, y = linear_141_cast_fp16)[name = string("input_283_cast_fp16")]; tensor input_285_axes_0 = const()[name = string("input_285_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_23_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_23_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(395075008)))]; tensor encoder_text_model_encoder_layers_23_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_23_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(395077632)))]; tensor input_285_cast_fp16 = layer_norm(axes = input_285_axes_0, beta = encoder_text_model_encoder_layers_23_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_23_layer_norm2_weight_to_fp16, x = input_283_cast_fp16)[name = string("input_285_cast_fp16")]; tensor encoder_text_model_encoder_layers_23_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(395080256))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(399995520))))[name = string("encoder_text_model_encoder_layers_23_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_23_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_23_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(400036544)))]; tensor linear_142_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_23_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_23_mlp_fc1_weight_to_fp16_palettized, x = input_285_cast_fp16)[name = string("linear_142_cast_fp16")]; string input_289_mode_0 = const()[name = string("input_289_mode_0"), val = string("EXACT")]; tensor input_289_cast_fp16 = gelu(mode = input_289_mode_0, x = linear_142_cast_fp16)[name = string("input_289_cast_fp16")]; tensor encoder_text_model_encoder_layers_23_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(400046848))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(404962112))))[name = string("encoder_text_model_encoder_layers_23_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_23_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_23_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(404972416)))]; tensor linear_143_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_23_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_23_mlp_fc2_weight_to_fp16_palettized, x = input_289_cast_fp16)[name = string("linear_143_cast_fp16")]; tensor input_291_cast_fp16 = add(x = input_283_cast_fp16, y = linear_143_cast_fp16)[name = string("input_291_cast_fp16")]; tensor hidden_states_145_axes_0 = const()[name = string("hidden_states_145_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_24_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_24_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(404975040)))]; tensor encoder_text_model_encoder_layers_24_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_24_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(404977664)))]; tensor hidden_states_145_cast_fp16 = layer_norm(axes = hidden_states_145_axes_0, beta = encoder_text_model_encoder_layers_24_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_24_layer_norm1_weight_to_fp16, x = input_291_cast_fp16)[name = string("hidden_states_145_cast_fp16")]; tensor encoder_text_model_encoder_layers_24_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(404980288))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(406209152))))[name = string("encoder_text_model_encoder_layers_24_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_24_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_24_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(406219456)))]; tensor linear_144_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_24_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_24_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_145_cast_fp16)[name = string("linear_144_cast_fp16")]; tensor encoder_text_model_encoder_layers_24_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(406222080))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(407450944))))[name = string("encoder_text_model_encoder_layers_24_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_24_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_24_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(407461248)))]; tensor linear_145_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_24_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_24_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_145_cast_fp16)[name = string("linear_145_cast_fp16")]; tensor encoder_text_model_encoder_layers_24_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(407463872))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(408692736))))[name = string("encoder_text_model_encoder_layers_24_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_24_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_24_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(408703040)))]; tensor linear_146_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_24_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_24_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_145_cast_fp16)[name = string("linear_146_cast_fp16")]; tensor var_1469 = const()[name = string("op_1469"), val = tensor([1, 77, -1, 64])]; tensor var_1470_cast_fp16 = reshape(shape = var_1469, x = linear_144_cast_fp16)[name = string("op_1470_cast_fp16")]; tensor var_1472 = const()[name = string("op_1472"), val = tensor([1, 77, -1, 64])]; tensor var_1473_cast_fp16 = reshape(shape = var_1472, x = linear_145_cast_fp16)[name = string("op_1473_cast_fp16")]; tensor var_1475 = const()[name = string("op_1475"), val = tensor([1, 77, -1, 64])]; tensor var_1476_cast_fp16 = reshape(shape = var_1475, x = linear_146_cast_fp16)[name = string("op_1476_cast_fp16")]; tensor value_49_perm_0 = const()[name = string("value_49_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_49_cast_fp16 = mul(x = var_1470_cast_fp16, y = var_11_to_fp16)[name = string("mul_49_cast_fp16")]; bool matmul_24_transpose_y_0 = const()[name = string("matmul_24_transpose_y_0"), val = bool(true)]; bool matmul_24_transpose_x_0 = const()[name = string("matmul_24_transpose_x_0"), val = bool(false)]; tensor transpose_176_perm_0 = const()[name = string("transpose_176_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_177_perm_0 = const()[name = string("transpose_177_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_177 = transpose(perm = transpose_177_perm_0, x = var_1473_cast_fp16)[name = string("transpose_222")]; tensor transpose_176 = transpose(perm = transpose_176_perm_0, x = mul_49_cast_fp16)[name = string("transpose_223")]; tensor matmul_24_cast_fp16 = matmul(transpose_x = matmul_24_transpose_x_0, transpose_y = matmul_24_transpose_y_0, x = transpose_176, y = transpose_177)[name = string("matmul_24_cast_fp16")]; tensor add_24_cast_fp16 = add(x = matmul_24_cast_fp16, y = mul_0_to_fp16)[name = string("add_24_cast_fp16")]; int32 softmax_24_axis_0 = const()[name = string("softmax_24_axis_0"), val = int32(-1)]; tensor softmax_24_cast_fp16 = softmax(axis = softmax_24_axis_0, x = add_24_cast_fp16)[name = string("softmax_24_cast_fp16")]; bool attn_output_97_transpose_x_0 = const()[name = string("attn_output_97_transpose_x_0"), val = bool(false)]; bool attn_output_97_transpose_y_0 = const()[name = string("attn_output_97_transpose_y_0"), val = bool(false)]; tensor value_49_cast_fp16 = transpose(perm = value_49_perm_0, x = var_1476_cast_fp16)[name = string("transpose_221")]; tensor attn_output_97_cast_fp16 = matmul(transpose_x = attn_output_97_transpose_x_0, transpose_y = attn_output_97_transpose_y_0, x = softmax_24_cast_fp16, y = value_49_cast_fp16)[name = string("attn_output_97_cast_fp16")]; tensor var_1479_perm_0 = const()[name = string("op_1479_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1481 = const()[name = string("op_1481"), val = tensor([1, 77, -1])]; tensor var_1479_cast_fp16 = transpose(perm = var_1479_perm_0, x = attn_output_97_cast_fp16)[name = string("transpose_220")]; tensor var_1482_cast_fp16 = reshape(shape = var_1481, x = var_1479_cast_fp16)[name = string("op_1482_cast_fp16")]; tensor encoder_text_model_encoder_layers_24_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(408705664))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(409934528))))[name = string("encoder_text_model_encoder_layers_24_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_24_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_24_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(409944832)))]; tensor linear_147_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_24_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_24_self_attn_out_proj_weight_to_fp16_palettized, x = var_1482_cast_fp16)[name = string("linear_147_cast_fp16")]; tensor input_295_cast_fp16 = add(x = input_291_cast_fp16, y = linear_147_cast_fp16)[name = string("input_295_cast_fp16")]; tensor input_297_axes_0 = const()[name = string("input_297_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_24_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_24_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(409947456)))]; tensor encoder_text_model_encoder_layers_24_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_24_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(409950080)))]; tensor input_297_cast_fp16 = layer_norm(axes = input_297_axes_0, beta = encoder_text_model_encoder_layers_24_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_24_layer_norm2_weight_to_fp16, x = input_295_cast_fp16)[name = string("input_297_cast_fp16")]; tensor encoder_text_model_encoder_layers_24_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(409952704))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(414867968))))[name = string("encoder_text_model_encoder_layers_24_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_24_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_24_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(414908992)))]; tensor linear_148_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_24_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_24_mlp_fc1_weight_to_fp16_palettized, x = input_297_cast_fp16)[name = string("linear_148_cast_fp16")]; string input_301_mode_0 = const()[name = string("input_301_mode_0"), val = string("EXACT")]; tensor input_301_cast_fp16 = gelu(mode = input_301_mode_0, x = linear_148_cast_fp16)[name = string("input_301_cast_fp16")]; tensor encoder_text_model_encoder_layers_24_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(414919296))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(419834560))))[name = string("encoder_text_model_encoder_layers_24_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_24_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_24_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(419844864)))]; tensor linear_149_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_24_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_24_mlp_fc2_weight_to_fp16_palettized, x = input_301_cast_fp16)[name = string("linear_149_cast_fp16")]; tensor input_303_cast_fp16 = add(x = input_295_cast_fp16, y = linear_149_cast_fp16)[name = string("input_303_cast_fp16")]; tensor hidden_states_151_axes_0 = const()[name = string("hidden_states_151_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_25_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_25_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(419847488)))]; tensor encoder_text_model_encoder_layers_25_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_25_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(419850112)))]; tensor hidden_states_151_cast_fp16 = layer_norm(axes = hidden_states_151_axes_0, beta = encoder_text_model_encoder_layers_25_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_25_layer_norm1_weight_to_fp16, x = input_303_cast_fp16)[name = string("hidden_states_151_cast_fp16")]; tensor encoder_text_model_encoder_layers_25_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(419852736))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(421081600))))[name = string("encoder_text_model_encoder_layers_25_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_25_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_25_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(421091904)))]; tensor linear_150_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_25_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_25_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_151_cast_fp16)[name = string("linear_150_cast_fp16")]; tensor encoder_text_model_encoder_layers_25_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(421094528))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(422323392))))[name = string("encoder_text_model_encoder_layers_25_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_25_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_25_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(422333696)))]; tensor linear_151_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_25_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_25_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_151_cast_fp16)[name = string("linear_151_cast_fp16")]; tensor encoder_text_model_encoder_layers_25_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(422336320))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(423565184))))[name = string("encoder_text_model_encoder_layers_25_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_25_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_25_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(423575488)))]; tensor linear_152_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_25_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_25_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_151_cast_fp16)[name = string("linear_152_cast_fp16")]; tensor var_1525 = const()[name = string("op_1525"), val = tensor([1, 77, -1, 64])]; tensor var_1526_cast_fp16 = reshape(shape = var_1525, x = linear_150_cast_fp16)[name = string("op_1526_cast_fp16")]; tensor var_1528 = const()[name = string("op_1528"), val = tensor([1, 77, -1, 64])]; tensor var_1529_cast_fp16 = reshape(shape = var_1528, x = linear_151_cast_fp16)[name = string("op_1529_cast_fp16")]; tensor var_1531 = const()[name = string("op_1531"), val = tensor([1, 77, -1, 64])]; tensor var_1532_cast_fp16 = reshape(shape = var_1531, x = linear_152_cast_fp16)[name = string("op_1532_cast_fp16")]; tensor value_51_perm_0 = const()[name = string("value_51_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_51_cast_fp16 = mul(x = var_1526_cast_fp16, y = var_11_to_fp16)[name = string("mul_51_cast_fp16")]; bool matmul_25_transpose_y_0 = const()[name = string("matmul_25_transpose_y_0"), val = bool(true)]; bool matmul_25_transpose_x_0 = const()[name = string("matmul_25_transpose_x_0"), val = bool(false)]; tensor transpose_178_perm_0 = const()[name = string("transpose_178_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_179_perm_0 = const()[name = string("transpose_179_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_179 = transpose(perm = transpose_179_perm_0, x = var_1529_cast_fp16)[name = string("transpose_218")]; tensor transpose_178 = transpose(perm = transpose_178_perm_0, x = mul_51_cast_fp16)[name = string("transpose_219")]; tensor matmul_25_cast_fp16 = matmul(transpose_x = matmul_25_transpose_x_0, transpose_y = matmul_25_transpose_y_0, x = transpose_178, y = transpose_179)[name = string("matmul_25_cast_fp16")]; tensor add_25_cast_fp16 = add(x = matmul_25_cast_fp16, y = mul_0_to_fp16)[name = string("add_25_cast_fp16")]; int32 softmax_25_axis_0 = const()[name = string("softmax_25_axis_0"), val = int32(-1)]; tensor softmax_25_cast_fp16 = softmax(axis = softmax_25_axis_0, x = add_25_cast_fp16)[name = string("softmax_25_cast_fp16")]; bool attn_output_101_transpose_x_0 = const()[name = string("attn_output_101_transpose_x_0"), val = bool(false)]; bool attn_output_101_transpose_y_0 = const()[name = string("attn_output_101_transpose_y_0"), val = bool(false)]; tensor value_51_cast_fp16 = transpose(perm = value_51_perm_0, x = var_1532_cast_fp16)[name = string("transpose_217")]; tensor attn_output_101_cast_fp16 = matmul(transpose_x = attn_output_101_transpose_x_0, transpose_y = attn_output_101_transpose_y_0, x = softmax_25_cast_fp16, y = value_51_cast_fp16)[name = string("attn_output_101_cast_fp16")]; tensor var_1535_perm_0 = const()[name = string("op_1535_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1537 = const()[name = string("op_1537"), val = tensor([1, 77, -1])]; tensor var_1535_cast_fp16 = transpose(perm = var_1535_perm_0, x = attn_output_101_cast_fp16)[name = string("transpose_216")]; tensor var_1538_cast_fp16 = reshape(shape = var_1537, x = var_1535_cast_fp16)[name = string("op_1538_cast_fp16")]; tensor encoder_text_model_encoder_layers_25_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(423578112))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(424806976))))[name = string("encoder_text_model_encoder_layers_25_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_25_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_25_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(424817280)))]; tensor linear_153_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_25_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_25_self_attn_out_proj_weight_to_fp16_palettized, x = var_1538_cast_fp16)[name = string("linear_153_cast_fp16")]; tensor input_307_cast_fp16 = add(x = input_303_cast_fp16, y = linear_153_cast_fp16)[name = string("input_307_cast_fp16")]; tensor input_309_axes_0 = const()[name = string("input_309_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_25_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_25_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(424819904)))]; tensor encoder_text_model_encoder_layers_25_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_25_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(424822528)))]; tensor input_309_cast_fp16 = layer_norm(axes = input_309_axes_0, beta = encoder_text_model_encoder_layers_25_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_25_layer_norm2_weight_to_fp16, x = input_307_cast_fp16)[name = string("input_309_cast_fp16")]; tensor encoder_text_model_encoder_layers_25_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(424825152))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(429740416))))[name = string("encoder_text_model_encoder_layers_25_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_25_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_25_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(429781440)))]; tensor linear_154_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_25_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_25_mlp_fc1_weight_to_fp16_palettized, x = input_309_cast_fp16)[name = string("linear_154_cast_fp16")]; string input_313_mode_0 = const()[name = string("input_313_mode_0"), val = string("EXACT")]; tensor input_313_cast_fp16 = gelu(mode = input_313_mode_0, x = linear_154_cast_fp16)[name = string("input_313_cast_fp16")]; tensor encoder_text_model_encoder_layers_25_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(429791744))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(434707008))))[name = string("encoder_text_model_encoder_layers_25_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_25_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_25_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(434717312)))]; tensor linear_155_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_25_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_25_mlp_fc2_weight_to_fp16_palettized, x = input_313_cast_fp16)[name = string("linear_155_cast_fp16")]; tensor input_315_cast_fp16 = add(x = input_307_cast_fp16, y = linear_155_cast_fp16)[name = string("input_315_cast_fp16")]; tensor hidden_states_157_axes_0 = const()[name = string("hidden_states_157_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_26_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_26_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(434719936)))]; tensor encoder_text_model_encoder_layers_26_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_26_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(434722560)))]; tensor hidden_states_157_cast_fp16 = layer_norm(axes = hidden_states_157_axes_0, beta = encoder_text_model_encoder_layers_26_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_26_layer_norm1_weight_to_fp16, x = input_315_cast_fp16)[name = string("hidden_states_157_cast_fp16")]; tensor encoder_text_model_encoder_layers_26_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(434725184))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(435954048))))[name = string("encoder_text_model_encoder_layers_26_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_26_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_26_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(435964352)))]; tensor linear_156_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_26_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_26_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_157_cast_fp16)[name = string("linear_156_cast_fp16")]; tensor encoder_text_model_encoder_layers_26_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(435966976))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(437195840))))[name = string("encoder_text_model_encoder_layers_26_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_26_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_26_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(437206144)))]; tensor linear_157_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_26_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_26_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_157_cast_fp16)[name = string("linear_157_cast_fp16")]; tensor encoder_text_model_encoder_layers_26_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(437208768))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(438437632))))[name = string("encoder_text_model_encoder_layers_26_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_26_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_26_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(438447936)))]; tensor linear_158_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_26_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_26_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_157_cast_fp16)[name = string("linear_158_cast_fp16")]; tensor var_1581 = const()[name = string("op_1581"), val = tensor([1, 77, -1, 64])]; tensor var_1582_cast_fp16 = reshape(shape = var_1581, x = linear_156_cast_fp16)[name = string("op_1582_cast_fp16")]; tensor var_1584 = const()[name = string("op_1584"), val = tensor([1, 77, -1, 64])]; tensor var_1585_cast_fp16 = reshape(shape = var_1584, x = linear_157_cast_fp16)[name = string("op_1585_cast_fp16")]; tensor var_1587 = const()[name = string("op_1587"), val = tensor([1, 77, -1, 64])]; tensor var_1588_cast_fp16 = reshape(shape = var_1587, x = linear_158_cast_fp16)[name = string("op_1588_cast_fp16")]; tensor value_53_perm_0 = const()[name = string("value_53_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_53_cast_fp16 = mul(x = var_1582_cast_fp16, y = var_11_to_fp16)[name = string("mul_53_cast_fp16")]; bool matmul_26_transpose_y_0 = const()[name = string("matmul_26_transpose_y_0"), val = bool(true)]; bool matmul_26_transpose_x_0 = const()[name = string("matmul_26_transpose_x_0"), val = bool(false)]; tensor transpose_180_perm_0 = const()[name = string("transpose_180_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_181_perm_0 = const()[name = string("transpose_181_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_181 = transpose(perm = transpose_181_perm_0, x = var_1585_cast_fp16)[name = string("transpose_214")]; tensor transpose_180 = transpose(perm = transpose_180_perm_0, x = mul_53_cast_fp16)[name = string("transpose_215")]; tensor matmul_26_cast_fp16 = matmul(transpose_x = matmul_26_transpose_x_0, transpose_y = matmul_26_transpose_y_0, x = transpose_180, y = transpose_181)[name = string("matmul_26_cast_fp16")]; tensor add_26_cast_fp16 = add(x = matmul_26_cast_fp16, y = mul_0_to_fp16)[name = string("add_26_cast_fp16")]; int32 softmax_26_axis_0 = const()[name = string("softmax_26_axis_0"), val = int32(-1)]; tensor softmax_26_cast_fp16 = softmax(axis = softmax_26_axis_0, x = add_26_cast_fp16)[name = string("softmax_26_cast_fp16")]; bool attn_output_105_transpose_x_0 = const()[name = string("attn_output_105_transpose_x_0"), val = bool(false)]; bool attn_output_105_transpose_y_0 = const()[name = string("attn_output_105_transpose_y_0"), val = bool(false)]; tensor value_53_cast_fp16 = transpose(perm = value_53_perm_0, x = var_1588_cast_fp16)[name = string("transpose_213")]; tensor attn_output_105_cast_fp16 = matmul(transpose_x = attn_output_105_transpose_x_0, transpose_y = attn_output_105_transpose_y_0, x = softmax_26_cast_fp16, y = value_53_cast_fp16)[name = string("attn_output_105_cast_fp16")]; tensor var_1591_perm_0 = const()[name = string("op_1591_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1593 = const()[name = string("op_1593"), val = tensor([1, 77, -1])]; tensor var_1591_cast_fp16 = transpose(perm = var_1591_perm_0, x = attn_output_105_cast_fp16)[name = string("transpose_212")]; tensor var_1594_cast_fp16 = reshape(shape = var_1593, x = var_1591_cast_fp16)[name = string("op_1594_cast_fp16")]; tensor encoder_text_model_encoder_layers_26_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(438450560))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(439679424))))[name = string("encoder_text_model_encoder_layers_26_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_26_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_26_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(439689728)))]; tensor linear_159_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_26_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_26_self_attn_out_proj_weight_to_fp16_palettized, x = var_1594_cast_fp16)[name = string("linear_159_cast_fp16")]; tensor input_319_cast_fp16 = add(x = input_315_cast_fp16, y = linear_159_cast_fp16)[name = string("input_319_cast_fp16")]; tensor input_321_axes_0 = const()[name = string("input_321_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_26_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_26_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(439692352)))]; tensor encoder_text_model_encoder_layers_26_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_26_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(439694976)))]; tensor input_321_cast_fp16 = layer_norm(axes = input_321_axes_0, beta = encoder_text_model_encoder_layers_26_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_26_layer_norm2_weight_to_fp16, x = input_319_cast_fp16)[name = string("input_321_cast_fp16")]; tensor encoder_text_model_encoder_layers_26_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(439697600))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(444612864))))[name = string("encoder_text_model_encoder_layers_26_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_26_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_26_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(444653888)))]; tensor linear_160_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_26_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_26_mlp_fc1_weight_to_fp16_palettized, x = input_321_cast_fp16)[name = string("linear_160_cast_fp16")]; string input_325_mode_0 = const()[name = string("input_325_mode_0"), val = string("EXACT")]; tensor input_325_cast_fp16 = gelu(mode = input_325_mode_0, x = linear_160_cast_fp16)[name = string("input_325_cast_fp16")]; tensor encoder_text_model_encoder_layers_26_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(444664192))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(449579456))))[name = string("encoder_text_model_encoder_layers_26_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_26_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_26_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(449589760)))]; tensor linear_161_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_26_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_26_mlp_fc2_weight_to_fp16_palettized, x = input_325_cast_fp16)[name = string("linear_161_cast_fp16")]; tensor input_327_cast_fp16 = add(x = input_319_cast_fp16, y = linear_161_cast_fp16)[name = string("input_327_cast_fp16")]; tensor hidden_states_163_axes_0 = const()[name = string("hidden_states_163_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_27_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_27_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(449592384)))]; tensor encoder_text_model_encoder_layers_27_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_27_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(449595008)))]; tensor hidden_states_163_cast_fp16 = layer_norm(axes = hidden_states_163_axes_0, beta = encoder_text_model_encoder_layers_27_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_27_layer_norm1_weight_to_fp16, x = input_327_cast_fp16)[name = string("hidden_states_163_cast_fp16")]; tensor encoder_text_model_encoder_layers_27_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(449597632))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(450826496))))[name = string("encoder_text_model_encoder_layers_27_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_27_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_27_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(450836800)))]; tensor linear_162_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_27_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_27_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_163_cast_fp16)[name = string("linear_162_cast_fp16")]; tensor encoder_text_model_encoder_layers_27_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(450839424))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(452068288))))[name = string("encoder_text_model_encoder_layers_27_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_27_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_27_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(452078592)))]; tensor linear_163_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_27_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_27_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_163_cast_fp16)[name = string("linear_163_cast_fp16")]; tensor encoder_text_model_encoder_layers_27_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(452081216))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(453310080))))[name = string("encoder_text_model_encoder_layers_27_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_27_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_27_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(453320384)))]; tensor linear_164_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_27_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_27_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_163_cast_fp16)[name = string("linear_164_cast_fp16")]; tensor var_1637 = const()[name = string("op_1637"), val = tensor([1, 77, -1, 64])]; tensor var_1638_cast_fp16 = reshape(shape = var_1637, x = linear_162_cast_fp16)[name = string("op_1638_cast_fp16")]; tensor var_1640 = const()[name = string("op_1640"), val = tensor([1, 77, -1, 64])]; tensor var_1641_cast_fp16 = reshape(shape = var_1640, x = linear_163_cast_fp16)[name = string("op_1641_cast_fp16")]; tensor var_1643 = const()[name = string("op_1643"), val = tensor([1, 77, -1, 64])]; tensor var_1644_cast_fp16 = reshape(shape = var_1643, x = linear_164_cast_fp16)[name = string("op_1644_cast_fp16")]; tensor value_55_perm_0 = const()[name = string("value_55_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_55_cast_fp16 = mul(x = var_1638_cast_fp16, y = var_11_to_fp16)[name = string("mul_55_cast_fp16")]; bool matmul_27_transpose_y_0 = const()[name = string("matmul_27_transpose_y_0"), val = bool(true)]; bool matmul_27_transpose_x_0 = const()[name = string("matmul_27_transpose_x_0"), val = bool(false)]; tensor transpose_182_perm_0 = const()[name = string("transpose_182_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_183_perm_0 = const()[name = string("transpose_183_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_183 = transpose(perm = transpose_183_perm_0, x = var_1641_cast_fp16)[name = string("transpose_210")]; tensor transpose_182 = transpose(perm = transpose_182_perm_0, x = mul_55_cast_fp16)[name = string("transpose_211")]; tensor matmul_27_cast_fp16 = matmul(transpose_x = matmul_27_transpose_x_0, transpose_y = matmul_27_transpose_y_0, x = transpose_182, y = transpose_183)[name = string("matmul_27_cast_fp16")]; tensor add_27_cast_fp16 = add(x = matmul_27_cast_fp16, y = mul_0_to_fp16)[name = string("add_27_cast_fp16")]; int32 softmax_27_axis_0 = const()[name = string("softmax_27_axis_0"), val = int32(-1)]; tensor softmax_27_cast_fp16 = softmax(axis = softmax_27_axis_0, x = add_27_cast_fp16)[name = string("softmax_27_cast_fp16")]; bool attn_output_109_transpose_x_0 = const()[name = string("attn_output_109_transpose_x_0"), val = bool(false)]; bool attn_output_109_transpose_y_0 = const()[name = string("attn_output_109_transpose_y_0"), val = bool(false)]; tensor value_55_cast_fp16 = transpose(perm = value_55_perm_0, x = var_1644_cast_fp16)[name = string("transpose_209")]; tensor attn_output_109_cast_fp16 = matmul(transpose_x = attn_output_109_transpose_x_0, transpose_y = attn_output_109_transpose_y_0, x = softmax_27_cast_fp16, y = value_55_cast_fp16)[name = string("attn_output_109_cast_fp16")]; tensor var_1647_perm_0 = const()[name = string("op_1647_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1649 = const()[name = string("op_1649"), val = tensor([1, 77, -1])]; tensor var_1647_cast_fp16 = transpose(perm = var_1647_perm_0, x = attn_output_109_cast_fp16)[name = string("transpose_208")]; tensor var_1650_cast_fp16 = reshape(shape = var_1649, x = var_1647_cast_fp16)[name = string("op_1650_cast_fp16")]; tensor encoder_text_model_encoder_layers_27_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(453323008))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(454551872))))[name = string("encoder_text_model_encoder_layers_27_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_27_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_27_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(454562176)))]; tensor linear_165_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_27_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_27_self_attn_out_proj_weight_to_fp16_palettized, x = var_1650_cast_fp16)[name = string("linear_165_cast_fp16")]; tensor input_331_cast_fp16 = add(x = input_327_cast_fp16, y = linear_165_cast_fp16)[name = string("input_331_cast_fp16")]; tensor input_333_axes_0 = const()[name = string("input_333_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_27_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_27_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(454564800)))]; tensor encoder_text_model_encoder_layers_27_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_27_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(454567424)))]; tensor input_333_cast_fp16 = layer_norm(axes = input_333_axes_0, beta = encoder_text_model_encoder_layers_27_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_27_layer_norm2_weight_to_fp16, x = input_331_cast_fp16)[name = string("input_333_cast_fp16")]; tensor encoder_text_model_encoder_layers_27_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(454570048))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(459485312))))[name = string("encoder_text_model_encoder_layers_27_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_27_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_27_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(459526336)))]; tensor linear_166_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_27_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_27_mlp_fc1_weight_to_fp16_palettized, x = input_333_cast_fp16)[name = string("linear_166_cast_fp16")]; string input_337_mode_0 = const()[name = string("input_337_mode_0"), val = string("EXACT")]; tensor input_337_cast_fp16 = gelu(mode = input_337_mode_0, x = linear_166_cast_fp16)[name = string("input_337_cast_fp16")]; tensor encoder_text_model_encoder_layers_27_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(459536640))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(464451904))))[name = string("encoder_text_model_encoder_layers_27_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_27_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_27_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(464462208)))]; tensor linear_167_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_27_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_27_mlp_fc2_weight_to_fp16_palettized, x = input_337_cast_fp16)[name = string("linear_167_cast_fp16")]; tensor input_339_cast_fp16 = add(x = input_331_cast_fp16, y = linear_167_cast_fp16)[name = string("input_339_cast_fp16")]; tensor hidden_states_169_axes_0 = const()[name = string("hidden_states_169_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_28_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_28_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(464464832)))]; tensor encoder_text_model_encoder_layers_28_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_28_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(464467456)))]; tensor hidden_states_169_cast_fp16 = layer_norm(axes = hidden_states_169_axes_0, beta = encoder_text_model_encoder_layers_28_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_28_layer_norm1_weight_to_fp16, x = input_339_cast_fp16)[name = string("hidden_states_169_cast_fp16")]; tensor encoder_text_model_encoder_layers_28_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(464470080))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(465698944))))[name = string("encoder_text_model_encoder_layers_28_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_28_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_28_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(465709248)))]; tensor linear_168_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_28_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_28_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_169_cast_fp16)[name = string("linear_168_cast_fp16")]; tensor encoder_text_model_encoder_layers_28_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(465711872))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(466940736))))[name = string("encoder_text_model_encoder_layers_28_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_28_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_28_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(466951040)))]; tensor linear_169_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_28_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_28_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_169_cast_fp16)[name = string("linear_169_cast_fp16")]; tensor encoder_text_model_encoder_layers_28_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(466953664))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(468182528))))[name = string("encoder_text_model_encoder_layers_28_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_28_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_28_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(468192832)))]; tensor linear_170_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_28_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_28_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_169_cast_fp16)[name = string("linear_170_cast_fp16")]; tensor var_1693 = const()[name = string("op_1693"), val = tensor([1, 77, -1, 64])]; tensor var_1694_cast_fp16 = reshape(shape = var_1693, x = linear_168_cast_fp16)[name = string("op_1694_cast_fp16")]; tensor var_1696 = const()[name = string("op_1696"), val = tensor([1, 77, -1, 64])]; tensor var_1697_cast_fp16 = reshape(shape = var_1696, x = linear_169_cast_fp16)[name = string("op_1697_cast_fp16")]; tensor var_1699 = const()[name = string("op_1699"), val = tensor([1, 77, -1, 64])]; tensor var_1700_cast_fp16 = reshape(shape = var_1699, x = linear_170_cast_fp16)[name = string("op_1700_cast_fp16")]; tensor value_57_perm_0 = const()[name = string("value_57_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_57_cast_fp16 = mul(x = var_1694_cast_fp16, y = var_11_to_fp16)[name = string("mul_57_cast_fp16")]; bool matmul_28_transpose_y_0 = const()[name = string("matmul_28_transpose_y_0"), val = bool(true)]; bool matmul_28_transpose_x_0 = const()[name = string("matmul_28_transpose_x_0"), val = bool(false)]; tensor transpose_184_perm_0 = const()[name = string("transpose_184_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_185_perm_0 = const()[name = string("transpose_185_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_185 = transpose(perm = transpose_185_perm_0, x = var_1697_cast_fp16)[name = string("transpose_206")]; tensor transpose_184 = transpose(perm = transpose_184_perm_0, x = mul_57_cast_fp16)[name = string("transpose_207")]; tensor matmul_28_cast_fp16 = matmul(transpose_x = matmul_28_transpose_x_0, transpose_y = matmul_28_transpose_y_0, x = transpose_184, y = transpose_185)[name = string("matmul_28_cast_fp16")]; tensor add_28_cast_fp16 = add(x = matmul_28_cast_fp16, y = mul_0_to_fp16)[name = string("add_28_cast_fp16")]; int32 softmax_28_axis_0 = const()[name = string("softmax_28_axis_0"), val = int32(-1)]; tensor softmax_28_cast_fp16 = softmax(axis = softmax_28_axis_0, x = add_28_cast_fp16)[name = string("softmax_28_cast_fp16")]; bool attn_output_113_transpose_x_0 = const()[name = string("attn_output_113_transpose_x_0"), val = bool(false)]; bool attn_output_113_transpose_y_0 = const()[name = string("attn_output_113_transpose_y_0"), val = bool(false)]; tensor value_57_cast_fp16 = transpose(perm = value_57_perm_0, x = var_1700_cast_fp16)[name = string("transpose_205")]; tensor attn_output_113_cast_fp16 = matmul(transpose_x = attn_output_113_transpose_x_0, transpose_y = attn_output_113_transpose_y_0, x = softmax_28_cast_fp16, y = value_57_cast_fp16)[name = string("attn_output_113_cast_fp16")]; tensor var_1703_perm_0 = const()[name = string("op_1703_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1705 = const()[name = string("op_1705"), val = tensor([1, 77, -1])]; tensor var_1703_cast_fp16 = transpose(perm = var_1703_perm_0, x = attn_output_113_cast_fp16)[name = string("transpose_204")]; tensor var_1706_cast_fp16 = reshape(shape = var_1705, x = var_1703_cast_fp16)[name = string("op_1706_cast_fp16")]; tensor encoder_text_model_encoder_layers_28_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(468195456))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(469424320))))[name = string("encoder_text_model_encoder_layers_28_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_28_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_28_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(469434624)))]; tensor linear_171_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_28_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_28_self_attn_out_proj_weight_to_fp16_palettized, x = var_1706_cast_fp16)[name = string("linear_171_cast_fp16")]; tensor input_343_cast_fp16 = add(x = input_339_cast_fp16, y = linear_171_cast_fp16)[name = string("input_343_cast_fp16")]; tensor input_345_axes_0 = const()[name = string("input_345_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_28_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_28_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(469437248)))]; tensor encoder_text_model_encoder_layers_28_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_28_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(469439872)))]; tensor input_345_cast_fp16 = layer_norm(axes = input_345_axes_0, beta = encoder_text_model_encoder_layers_28_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_28_layer_norm2_weight_to_fp16, x = input_343_cast_fp16)[name = string("input_345_cast_fp16")]; tensor encoder_text_model_encoder_layers_28_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(469442496))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(474357760))))[name = string("encoder_text_model_encoder_layers_28_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_28_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_28_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(474398784)))]; tensor linear_172_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_28_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_28_mlp_fc1_weight_to_fp16_palettized, x = input_345_cast_fp16)[name = string("linear_172_cast_fp16")]; string input_349_mode_0 = const()[name = string("input_349_mode_0"), val = string("EXACT")]; tensor input_349_cast_fp16 = gelu(mode = input_349_mode_0, x = linear_172_cast_fp16)[name = string("input_349_cast_fp16")]; tensor encoder_text_model_encoder_layers_28_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(474409088))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(479324352))))[name = string("encoder_text_model_encoder_layers_28_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_28_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_28_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(479334656)))]; tensor linear_173_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_28_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_28_mlp_fc2_weight_to_fp16_palettized, x = input_349_cast_fp16)[name = string("linear_173_cast_fp16")]; tensor input_351_cast_fp16 = add(x = input_343_cast_fp16, y = linear_173_cast_fp16)[name = string("input_351_cast_fp16")]; tensor hidden_states_175_axes_0 = const()[name = string("hidden_states_175_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_29_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_29_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(479337280)))]; tensor encoder_text_model_encoder_layers_29_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_29_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(479339904)))]; tensor hidden_states_175_cast_fp16 = layer_norm(axes = hidden_states_175_axes_0, beta = encoder_text_model_encoder_layers_29_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_29_layer_norm1_weight_to_fp16, x = input_351_cast_fp16)[name = string("hidden_states_175_cast_fp16")]; tensor encoder_text_model_encoder_layers_29_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(479342528))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(480571392))))[name = string("encoder_text_model_encoder_layers_29_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_29_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_29_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(480581696)))]; tensor linear_174_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_29_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_29_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_175_cast_fp16)[name = string("linear_174_cast_fp16")]; tensor encoder_text_model_encoder_layers_29_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(480584320))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(481813184))))[name = string("encoder_text_model_encoder_layers_29_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_29_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_29_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(481823488)))]; tensor linear_175_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_29_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_29_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_175_cast_fp16)[name = string("linear_175_cast_fp16")]; tensor encoder_text_model_encoder_layers_29_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(481826112))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(483054976))))[name = string("encoder_text_model_encoder_layers_29_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_29_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_29_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(483065280)))]; tensor linear_176_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_29_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_29_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_175_cast_fp16)[name = string("linear_176_cast_fp16")]; tensor var_1749 = const()[name = string("op_1749"), val = tensor([1, 77, -1, 64])]; tensor var_1750_cast_fp16 = reshape(shape = var_1749, x = linear_174_cast_fp16)[name = string("op_1750_cast_fp16")]; tensor var_1752 = const()[name = string("op_1752"), val = tensor([1, 77, -1, 64])]; tensor var_1753_cast_fp16 = reshape(shape = var_1752, x = linear_175_cast_fp16)[name = string("op_1753_cast_fp16")]; tensor var_1755 = const()[name = string("op_1755"), val = tensor([1, 77, -1, 64])]; tensor var_1756_cast_fp16 = reshape(shape = var_1755, x = linear_176_cast_fp16)[name = string("op_1756_cast_fp16")]; tensor value_59_perm_0 = const()[name = string("value_59_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_59_cast_fp16 = mul(x = var_1750_cast_fp16, y = var_11_to_fp16)[name = string("mul_59_cast_fp16")]; bool matmul_29_transpose_y_0 = const()[name = string("matmul_29_transpose_y_0"), val = bool(true)]; bool matmul_29_transpose_x_0 = const()[name = string("matmul_29_transpose_x_0"), val = bool(false)]; tensor transpose_186_perm_0 = const()[name = string("transpose_186_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_187_perm_0 = const()[name = string("transpose_187_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_187 = transpose(perm = transpose_187_perm_0, x = var_1753_cast_fp16)[name = string("transpose_202")]; tensor transpose_186 = transpose(perm = transpose_186_perm_0, x = mul_59_cast_fp16)[name = string("transpose_203")]; tensor matmul_29_cast_fp16 = matmul(transpose_x = matmul_29_transpose_x_0, transpose_y = matmul_29_transpose_y_0, x = transpose_186, y = transpose_187)[name = string("matmul_29_cast_fp16")]; tensor add_29_cast_fp16 = add(x = matmul_29_cast_fp16, y = mul_0_to_fp16)[name = string("add_29_cast_fp16")]; int32 softmax_29_axis_0 = const()[name = string("softmax_29_axis_0"), val = int32(-1)]; tensor softmax_29_cast_fp16 = softmax(axis = softmax_29_axis_0, x = add_29_cast_fp16)[name = string("softmax_29_cast_fp16")]; bool attn_output_117_transpose_x_0 = const()[name = string("attn_output_117_transpose_x_0"), val = bool(false)]; bool attn_output_117_transpose_y_0 = const()[name = string("attn_output_117_transpose_y_0"), val = bool(false)]; tensor value_59_cast_fp16 = transpose(perm = value_59_perm_0, x = var_1756_cast_fp16)[name = string("transpose_201")]; tensor attn_output_117_cast_fp16 = matmul(transpose_x = attn_output_117_transpose_x_0, transpose_y = attn_output_117_transpose_y_0, x = softmax_29_cast_fp16, y = value_59_cast_fp16)[name = string("attn_output_117_cast_fp16")]; tensor var_1759_perm_0 = const()[name = string("op_1759_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1761 = const()[name = string("op_1761"), val = tensor([1, 77, -1])]; tensor var_1759_cast_fp16 = transpose(perm = var_1759_perm_0, x = attn_output_117_cast_fp16)[name = string("transpose_200")]; tensor var_1762_cast_fp16 = reshape(shape = var_1761, x = var_1759_cast_fp16)[name = string("op_1762_cast_fp16")]; tensor encoder_text_model_encoder_layers_29_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(483067904))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(484296768))))[name = string("encoder_text_model_encoder_layers_29_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_29_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_29_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(484307072)))]; tensor linear_177_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_29_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_29_self_attn_out_proj_weight_to_fp16_palettized, x = var_1762_cast_fp16)[name = string("linear_177_cast_fp16")]; tensor input_355_cast_fp16 = add(x = input_351_cast_fp16, y = linear_177_cast_fp16)[name = string("input_355_cast_fp16")]; tensor input_357_axes_0 = const()[name = string("input_357_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_29_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_29_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(484309696)))]; tensor encoder_text_model_encoder_layers_29_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_29_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(484312320)))]; tensor input_357_cast_fp16 = layer_norm(axes = input_357_axes_0, beta = encoder_text_model_encoder_layers_29_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_29_layer_norm2_weight_to_fp16, x = input_355_cast_fp16)[name = string("input_357_cast_fp16")]; tensor encoder_text_model_encoder_layers_29_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(484314944))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(489230208))))[name = string("encoder_text_model_encoder_layers_29_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_29_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_29_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(489271232)))]; tensor linear_178_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_29_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_29_mlp_fc1_weight_to_fp16_palettized, x = input_357_cast_fp16)[name = string("linear_178_cast_fp16")]; string input_361_mode_0 = const()[name = string("input_361_mode_0"), val = string("EXACT")]; tensor input_361_cast_fp16 = gelu(mode = input_361_mode_0, x = linear_178_cast_fp16)[name = string("input_361_cast_fp16")]; tensor encoder_text_model_encoder_layers_29_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(489281536))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(494196800))))[name = string("encoder_text_model_encoder_layers_29_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_29_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_29_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(494207104)))]; tensor linear_179_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_29_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_29_mlp_fc2_weight_to_fp16_palettized, x = input_361_cast_fp16)[name = string("linear_179_cast_fp16")]; tensor input_363_cast_fp16 = add(x = input_355_cast_fp16, y = linear_179_cast_fp16)[name = string("input_363_cast_fp16")]; tensor hidden_states_181_axes_0 = const()[name = string("hidden_states_181_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_30_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_30_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(494209728)))]; tensor encoder_text_model_encoder_layers_30_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_30_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(494212352)))]; tensor hidden_states_181_cast_fp16 = layer_norm(axes = hidden_states_181_axes_0, beta = encoder_text_model_encoder_layers_30_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_30_layer_norm1_weight_to_fp16, x = input_363_cast_fp16)[name = string("hidden_states_181_cast_fp16")]; tensor encoder_text_model_encoder_layers_30_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(494214976))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(495443840))))[name = string("encoder_text_model_encoder_layers_30_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_30_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_30_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(495454144)))]; tensor linear_180_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_30_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_30_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_181_cast_fp16)[name = string("linear_180_cast_fp16")]; tensor encoder_text_model_encoder_layers_30_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(495456768))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(496685632))))[name = string("encoder_text_model_encoder_layers_30_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_30_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_30_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(496695936)))]; tensor linear_181_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_30_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_30_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_181_cast_fp16)[name = string("linear_181_cast_fp16")]; tensor encoder_text_model_encoder_layers_30_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(496698560))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(497927424))))[name = string("encoder_text_model_encoder_layers_30_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_30_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_30_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(497937728)))]; tensor linear_182_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_30_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_30_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_181_cast_fp16)[name = string("linear_182_cast_fp16")]; tensor var_1805 = const()[name = string("op_1805"), val = tensor([1, 77, -1, 64])]; tensor var_1806_cast_fp16 = reshape(shape = var_1805, x = linear_180_cast_fp16)[name = string("op_1806_cast_fp16")]; tensor var_1808 = const()[name = string("op_1808"), val = tensor([1, 77, -1, 64])]; tensor var_1809_cast_fp16 = reshape(shape = var_1808, x = linear_181_cast_fp16)[name = string("op_1809_cast_fp16")]; tensor var_1811 = const()[name = string("op_1811"), val = tensor([1, 77, -1, 64])]; tensor var_1812_cast_fp16 = reshape(shape = var_1811, x = linear_182_cast_fp16)[name = string("op_1812_cast_fp16")]; tensor value_61_perm_0 = const()[name = string("value_61_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_61_cast_fp16 = mul(x = var_1806_cast_fp16, y = var_11_to_fp16)[name = string("mul_61_cast_fp16")]; bool matmul_30_transpose_y_0 = const()[name = string("matmul_30_transpose_y_0"), val = bool(true)]; bool matmul_30_transpose_x_0 = const()[name = string("matmul_30_transpose_x_0"), val = bool(false)]; tensor transpose_188_perm_0 = const()[name = string("transpose_188_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_189_perm_0 = const()[name = string("transpose_189_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_189 = transpose(perm = transpose_189_perm_0, x = var_1809_cast_fp16)[name = string("transpose_198")]; tensor transpose_188 = transpose(perm = transpose_188_perm_0, x = mul_61_cast_fp16)[name = string("transpose_199")]; tensor matmul_30_cast_fp16 = matmul(transpose_x = matmul_30_transpose_x_0, transpose_y = matmul_30_transpose_y_0, x = transpose_188, y = transpose_189)[name = string("matmul_30_cast_fp16")]; tensor add_30_cast_fp16 = add(x = matmul_30_cast_fp16, y = mul_0_to_fp16)[name = string("add_30_cast_fp16")]; int32 softmax_30_axis_0 = const()[name = string("softmax_30_axis_0"), val = int32(-1)]; tensor softmax_30_cast_fp16 = softmax(axis = softmax_30_axis_0, x = add_30_cast_fp16)[name = string("softmax_30_cast_fp16")]; bool attn_output_121_transpose_x_0 = const()[name = string("attn_output_121_transpose_x_0"), val = bool(false)]; bool attn_output_121_transpose_y_0 = const()[name = string("attn_output_121_transpose_y_0"), val = bool(false)]; tensor value_61_cast_fp16 = transpose(perm = value_61_perm_0, x = var_1812_cast_fp16)[name = string("transpose_197")]; tensor attn_output_121_cast_fp16 = matmul(transpose_x = attn_output_121_transpose_x_0, transpose_y = attn_output_121_transpose_y_0, x = softmax_30_cast_fp16, y = value_61_cast_fp16)[name = string("attn_output_121_cast_fp16")]; tensor var_1815_perm_0 = const()[name = string("op_1815_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1817 = const()[name = string("op_1817"), val = tensor([1, 77, -1])]; tensor var_1815_cast_fp16 = transpose(perm = var_1815_perm_0, x = attn_output_121_cast_fp16)[name = string("transpose_196")]; tensor var_1818_cast_fp16 = reshape(shape = var_1817, x = var_1815_cast_fp16)[name = string("op_1818_cast_fp16")]; tensor encoder_text_model_encoder_layers_30_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(497940352))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(499169216))))[name = string("encoder_text_model_encoder_layers_30_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_30_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_30_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(499179520)))]; tensor linear_183_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_30_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_30_self_attn_out_proj_weight_to_fp16_palettized, x = var_1818_cast_fp16)[name = string("linear_183_cast_fp16")]; tensor input_367_cast_fp16 = add(x = input_363_cast_fp16, y = linear_183_cast_fp16)[name = string("input_367_cast_fp16")]; tensor input_369_axes_0 = const()[name = string("input_369_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_30_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_30_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(499182144)))]; tensor encoder_text_model_encoder_layers_30_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_30_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(499184768)))]; tensor input_369_cast_fp16 = layer_norm(axes = input_369_axes_0, beta = encoder_text_model_encoder_layers_30_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_30_layer_norm2_weight_to_fp16, x = input_367_cast_fp16)[name = string("input_369_cast_fp16")]; tensor encoder_text_model_encoder_layers_30_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(499187392))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(504102656))))[name = string("encoder_text_model_encoder_layers_30_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_30_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_30_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(504143680)))]; tensor linear_184_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_30_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_30_mlp_fc1_weight_to_fp16_palettized, x = input_369_cast_fp16)[name = string("linear_184_cast_fp16")]; string input_373_mode_0 = const()[name = string("input_373_mode_0"), val = string("EXACT")]; tensor input_373_cast_fp16 = gelu(mode = input_373_mode_0, x = linear_184_cast_fp16)[name = string("input_373_cast_fp16")]; tensor encoder_text_model_encoder_layers_30_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(504153984))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(509069248))))[name = string("encoder_text_model_encoder_layers_30_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_30_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_30_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(509079552)))]; tensor linear_185_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_30_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_30_mlp_fc2_weight_to_fp16_palettized, x = input_373_cast_fp16)[name = string("linear_185_cast_fp16")]; tensor hidden_embeds = add(x = input_367_cast_fp16, y = linear_185_cast_fp16)[name = string("input_375_cast_fp16")]; tensor hidden_states_187_axes_0 = const()[name = string("hidden_states_187_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_31_layer_norm1_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_31_layer_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(509082176)))]; tensor encoder_text_model_encoder_layers_31_layer_norm1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_31_layer_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(509084800)))]; tensor hidden_states_187_cast_fp16 = layer_norm(axes = hidden_states_187_axes_0, beta = encoder_text_model_encoder_layers_31_layer_norm1_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_31_layer_norm1_weight_to_fp16, x = hidden_embeds)[name = string("hidden_states_187_cast_fp16")]; tensor encoder_text_model_encoder_layers_31_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(509087424))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(510316288))))[name = string("encoder_text_model_encoder_layers_31_self_attn_q_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_31_self_attn_q_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_31_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(510326592)))]; tensor linear_186_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_31_self_attn_q_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_31_self_attn_q_proj_weight_to_fp16_palettized, x = hidden_states_187_cast_fp16)[name = string("linear_186_cast_fp16")]; tensor encoder_text_model_encoder_layers_31_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(510329216))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(511558080))))[name = string("encoder_text_model_encoder_layers_31_self_attn_k_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_31_self_attn_k_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_31_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(511568384)))]; tensor linear_187_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_31_self_attn_k_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_31_self_attn_k_proj_weight_to_fp16_palettized, x = hidden_states_187_cast_fp16)[name = string("linear_187_cast_fp16")]; tensor encoder_text_model_encoder_layers_31_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(511571008))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(512799872))))[name = string("encoder_text_model_encoder_layers_31_self_attn_v_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_31_self_attn_v_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_31_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(512810176)))]; tensor linear_188_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_31_self_attn_v_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_31_self_attn_v_proj_weight_to_fp16_palettized, x = hidden_states_187_cast_fp16)[name = string("linear_188_cast_fp16")]; tensor var_1861 = const()[name = string("op_1861"), val = tensor([1, 77, -1, 64])]; tensor var_1862_cast_fp16 = reshape(shape = var_1861, x = linear_186_cast_fp16)[name = string("op_1862_cast_fp16")]; tensor var_1864 = const()[name = string("op_1864"), val = tensor([1, 77, -1, 64])]; tensor var_1865_cast_fp16 = reshape(shape = var_1864, x = linear_187_cast_fp16)[name = string("op_1865_cast_fp16")]; tensor var_1867 = const()[name = string("op_1867"), val = tensor([1, 77, -1, 64])]; tensor var_1868_cast_fp16 = reshape(shape = var_1867, x = linear_188_cast_fp16)[name = string("op_1868_cast_fp16")]; tensor value_perm_0 = const()[name = string("value_perm_0"), val = tensor([0, 2, -3, -1])]; tensor mul_63_cast_fp16 = mul(x = var_1862_cast_fp16, y = var_11_to_fp16)[name = string("mul_63_cast_fp16")]; bool matmul_31_transpose_y_0 = const()[name = string("matmul_31_transpose_y_0"), val = bool(true)]; bool matmul_31_transpose_x_0 = const()[name = string("matmul_31_transpose_x_0"), val = bool(false)]; tensor transpose_190_perm_0 = const()[name = string("transpose_190_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_191_perm_0 = const()[name = string("transpose_191_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_191 = transpose(perm = transpose_191_perm_0, x = var_1865_cast_fp16)[name = string("transpose_194")]; tensor transpose_190 = transpose(perm = transpose_190_perm_0, x = mul_63_cast_fp16)[name = string("transpose_195")]; tensor matmul_31_cast_fp16 = matmul(transpose_x = matmul_31_transpose_x_0, transpose_y = matmul_31_transpose_y_0, x = transpose_190, y = transpose_191)[name = string("matmul_31_cast_fp16")]; tensor add_31_cast_fp16 = add(x = matmul_31_cast_fp16, y = mul_0_to_fp16)[name = string("add_31_cast_fp16")]; int32 softmax_31_axis_0 = const()[name = string("softmax_31_axis_0"), val = int32(-1)]; tensor softmax_31_cast_fp16 = softmax(axis = softmax_31_axis_0, x = add_31_cast_fp16)[name = string("softmax_31_cast_fp16")]; bool attn_output_125_transpose_x_0 = const()[name = string("attn_output_125_transpose_x_0"), val = bool(false)]; bool attn_output_125_transpose_y_0 = const()[name = string("attn_output_125_transpose_y_0"), val = bool(false)]; tensor value_cast_fp16 = transpose(perm = value_perm_0, x = var_1868_cast_fp16)[name = string("transpose_193")]; tensor attn_output_125_cast_fp16 = matmul(transpose_x = attn_output_125_transpose_x_0, transpose_y = attn_output_125_transpose_y_0, x = softmax_31_cast_fp16, y = value_cast_fp16)[name = string("attn_output_125_cast_fp16")]; tensor var_1871_perm_0 = const()[name = string("op_1871_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1873 = const()[name = string("op_1873"), val = tensor([1, 77, -1])]; tensor var_1871_cast_fp16 = transpose(perm = var_1871_perm_0, x = attn_output_125_cast_fp16)[name = string("transpose_192")]; tensor var_1874_cast_fp16 = reshape(shape = var_1873, x = var_1871_cast_fp16)[name = string("op_1874_cast_fp16")]; tensor encoder_text_model_encoder_layers_31_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(512812800))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(514041664))))[name = string("encoder_text_model_encoder_layers_31_self_attn_out_proj_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_31_self_attn_out_proj_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_31_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(514051968)))]; tensor linear_189_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_31_self_attn_out_proj_bias_to_fp16, weight = encoder_text_model_encoder_layers_31_self_attn_out_proj_weight_to_fp16_palettized, x = var_1874_cast_fp16)[name = string("linear_189_cast_fp16")]; tensor input_379_cast_fp16 = add(x = hidden_embeds, y = linear_189_cast_fp16)[name = string("input_379_cast_fp16")]; tensor input_381_axes_0 = const()[name = string("input_381_axes_0"), val = tensor([-1])]; tensor encoder_text_model_encoder_layers_31_layer_norm2_weight_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_31_layer_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(514054592)))]; tensor encoder_text_model_encoder_layers_31_layer_norm2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_31_layer_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(514057216)))]; tensor input_381_cast_fp16 = layer_norm(axes = input_381_axes_0, beta = encoder_text_model_encoder_layers_31_layer_norm2_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_encoder_layers_31_layer_norm2_weight_to_fp16, x = input_379_cast_fp16)[name = string("input_381_cast_fp16")]; tensor encoder_text_model_encoder_layers_31_mlp_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(514059840))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(518975104))))[name = string("encoder_text_model_encoder_layers_31_mlp_fc1_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_31_mlp_fc1_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_31_mlp_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(519016128)))]; tensor linear_190_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_31_mlp_fc1_bias_to_fp16, weight = encoder_text_model_encoder_layers_31_mlp_fc1_weight_to_fp16_palettized, x = input_381_cast_fp16)[name = string("linear_190_cast_fp16")]; string input_385_mode_0 = const()[name = string("input_385_mode_0"), val = string("EXACT")]; tensor input_385_cast_fp16 = gelu(mode = input_385_mode_0, x = linear_190_cast_fp16)[name = string("input_385_cast_fp16")]; tensor encoder_text_model_encoder_layers_31_mlp_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(519026432))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(523941696))))[name = string("encoder_text_model_encoder_layers_31_mlp_fc2_weight_to_fp16_palettized")]; tensor encoder_text_model_encoder_layers_31_mlp_fc2_bias_to_fp16 = const()[name = string("encoder_text_model_encoder_layers_31_mlp_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(523952000)))]; tensor linear_191_cast_fp16 = linear(bias = encoder_text_model_encoder_layers_31_mlp_fc2_bias_to_fp16, weight = encoder_text_model_encoder_layers_31_mlp_fc2_weight_to_fp16_palettized, x = input_385_cast_fp16)[name = string("linear_191_cast_fp16")]; tensor input_387_cast_fp16 = add(x = input_379_cast_fp16, y = linear_191_cast_fp16)[name = string("input_387_cast_fp16")]; tensor last_hidden_state_axes_0 = const()[name = string("last_hidden_state_axes_0"), val = tensor([-1])]; tensor encoder_text_model_final_layer_norm_weight_to_fp16 = const()[name = string("encoder_text_model_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(523954624)))]; tensor encoder_text_model_final_layer_norm_bias_to_fp16 = const()[name = string("encoder_text_model_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(523957248)))]; tensor last_hidden_state_cast_fp16 = layer_norm(axes = last_hidden_state_axes_0, beta = encoder_text_model_final_layer_norm_bias_to_fp16, epsilon = var_9_to_fp16, gamma = encoder_text_model_final_layer_norm_weight_to_fp16, x = input_387_cast_fp16)[name = string("last_hidden_state_cast_fp16")]; tensor var_1902 = const()[name = string("op_1902"), val = tensor([0])]; int32 var_1904_axis_0 = const()[name = string("op_1904_axis_0"), val = int32(-1)]; bool var_1904_keep_dims_0 = const()[name = string("op_1904_keep_dims_0"), val = bool(false)]; string var_1904_output_dtype_0 = const()[name = string("op_1904_output_dtype_0"), val = string("int32")]; tensor var_1904 = reduce_argmax(axis = var_1904_axis_0, keep_dims = var_1904_keep_dims_0, output_dtype = var_1904_output_dtype_0, x = input_ids)[name = string("op_1904")]; int32 stack_0_axis_0 = const()[name = string("stack_0_axis_0"), val = int32(1)]; tensor stack_0 = stack(axis = stack_0_axis_0, values = (var_1902, var_1904))[name = string("stack_0")]; int32 input_transpose_batch_dims_0 = const()[name = string("input_transpose_batch_dims_0"), val = int32(0)]; bool input_transpose_validate_indices_0 = const()[name = string("input_transpose_validate_indices_0"), val = bool(false)]; string stack_0_to_uint16_dtype_0 = const()[name = string("stack_0_to_uint16_dtype_0"), val = string("uint16")]; tensor stack_0_to_uint16 = cast(dtype = stack_0_to_uint16_dtype_0, x = stack_0)[name = string("cast_0")]; tensor input_transpose_cast_fp16_cast_uint16 = gather_nd(batch_dims = input_transpose_batch_dims_0, indices = stack_0_to_uint16, validate_indices = input_transpose_validate_indices_0, x = last_hidden_state_cast_fp16)[name = string("input_transpose_cast_fp16_cast_uint16")]; tensor encoder_text_projection_weight_to_fp16_palettized = constexpr_lut_to_dense(indices = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(523959872))), lut = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(525188736))))[name = string("encoder_text_projection_weight_to_fp16_palettized")]; tensor linear_192_bias_0_to_fp16 = const()[name = string("linear_192_bias_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(525199040)))]; tensor pooled_outputs = linear(bias = linear_192_bias_0_to_fp16, weight = encoder_text_projection_weight_to_fp16_palettized, x = input_transpose_cast_fp16_cast_uint16)[name = string("linear_192_cast_fp16")]; } -> (hidden_embeds, pooled_outputs); }