program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3510.2.1"}, {"coremlc-version", "3500.32.1"}, {"coremltools-component-torch", "2.9.1"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "9.0"}})] { func main(tensor image) { tensor image__scaled___y_0 = const()[name = tensor("image__scaled___y_0"), val = tensor(0x1.de5c7ap-7)]; tensor image__scaled__ = mul(x = image, y = image__scaled___y_0)[name = tensor("image__scaled__")]; tensor image__biased___y_0 = const()[name = tensor("image__biased___y_0"), val = tensor([[[[-0x1.cad1b8p+0]], [[-0x1.c0897p+0]], [[-0x1.7aefaep+0]]]])]; tensor image__biased__ = add(x = image__scaled__, y = image__biased___y_0)[name = tensor("image__biased__")]; tensor var_20 = const()[name = tensor("op_20"), val = tensor(1)]; tensor x_1_pad_type_0 = const()[name = tensor("x_1_pad_type_0"), val = tensor("valid")]; tensor x_1_strides_0 = const()[name = tensor("x_1_strides_0"), val = tensor([32, 32])]; tensor x_1_pad_0 = const()[name = tensor("x_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor x_1_dilations_0 = const()[name = tensor("x_1_dilations_0"), val = tensor([1, 1])]; tensor x_1_groups_0 = const()[name = tensor("x_1_groups_0"), val = tensor(1)]; tensor image_to_fp16_dtype_0 = const()[name = tensor("image_to_fp16_dtype_0"), val = tensor("fp16")]; tensor model_visual_conv1_weight_to_fp16 = const()[name = tensor("model_visual_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor image_to_fp16 = cast(dtype = image_to_fp16_dtype_0, x = image__biased__)[name = tensor("cast_135")]; tensor x_1_cast_fp16 = conv(dilations = x_1_dilations_0, groups = x_1_groups_0, pad = x_1_pad_0, pad_type = x_1_pad_type_0, strides = x_1_strides_0, weight = model_visual_conv1_weight_to_fp16, x = image_to_fp16)[name = tensor("x_1_cast_fp16")]; tensor var_38 = const()[name = tensor("op_38"), val = tensor([1, 768, -1])]; tensor x_3_cast_fp16 = reshape(shape = var_38, x = x_1_cast_fp16)[name = tensor("x_3_cast_fp16")]; tensor var_40 = const()[name = tensor("op_40"), val = tensor([0, 2, 1])]; tensor x_7_interleave_0 = const()[name = tensor("x_7_interleave_0"), val = tensor(false)]; tensor const_3_to_fp16 = const()[name = tensor("const_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4718720)))]; tensor x_5_cast_fp16 = transpose(perm = var_40, x = x_3_cast_fp16)[name = tensor("transpose_85")]; tensor x_7_cast_fp16 = concat(axis = var_20, interleave = x_7_interleave_0, values = (const_3_to_fp16, x_5_cast_fp16))[name = tensor("x_7_cast_fp16")]; tensor const_4_to_fp16 = const()[name = tensor("const_4_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4720320)))]; tensor input_1_cast_fp16 = add(x = x_7_cast_fp16, y = const_4_to_fp16)[name = tensor("input_1_cast_fp16")]; tensor x_9_axes_0 = const()[name = tensor("x_9_axes_0"), val = tensor([-1])]; tensor model_visual_ln_pre_weight_to_fp16 = const()[name = tensor("model_visual_ln_pre_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4797184)))]; tensor model_visual_ln_pre_bias_to_fp16 = const()[name = tensor("model_visual_ln_pre_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4798784)))]; tensor var_13_to_fp16 = const()[name = tensor("op_13_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_9_cast_fp16 = layer_norm(axes = x_9_axes_0, beta = model_visual_ln_pre_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_ln_pre_weight_to_fp16, x = input_1_cast_fp16)[name = tensor("x_9_cast_fp16")]; tensor x_11_axes_0 = const()[name = tensor("x_11_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_0_ln_1_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_0_ln_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4800384)))]; tensor model_visual_transformer_resblocks_0_ln_1_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_0_ln_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4801984)))]; tensor x_11_cast_fp16 = layer_norm(axes = x_11_axes_0, beta = model_visual_transformer_resblocks_0_ln_1_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_0_ln_1_weight_to_fp16, x = x_9_cast_fp16)[name = tensor("x_11_cast_fp16")]; tensor query_3_perm_0 = const()[name = tensor("query_3_perm_0"), val = tensor([1, 0, 2])]; tensor model_visual_transformer_resblocks_0_attn_in_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_0_attn_in_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4803584)))]; tensor model_visual_transformer_resblocks_0_attn_in_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_0_attn_in_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8342592)))]; tensor query_3_cast_fp16 = transpose(perm = query_3_perm_0, x = x_11_cast_fp16)[name = tensor("transpose_84")]; tensor linear_0_cast_fp16 = linear(bias = model_visual_transformer_resblocks_0_attn_in_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_0_attn_in_proj_weight_to_fp16, x = query_3_cast_fp16)[name = tensor("linear_0_cast_fp16")]; tensor concat_1 = const()[name = tensor("concat_1"), val = tensor([50, 1, 3, 768])]; tensor var_113_cast_fp16 = reshape(shape = concat_1, x = linear_0_cast_fp16)[name = tensor("op_113_cast_fp16")]; tensor var_114_axes_0 = const()[name = tensor("op_114_axes_0"), val = tensor([0])]; tensor var_114_cast_fp16 = expand_dims(axes = var_114_axes_0, x = var_113_cast_fp16)[name = tensor("op_114_cast_fp16")]; tensor var_115_perm_0 = const()[name = tensor("op_115_perm_0"), val = tensor([-2, 1, 2, 0, 4])]; tensor var_116_axes_0 = const()[name = tensor("op_116_axes_0"), val = tensor([-2])]; tensor var_115_cast_fp16 = transpose(perm = var_115_perm_0, x = var_114_cast_fp16)[name = tensor("transpose_83")]; tensor var_116_cast_fp16 = squeeze(axes = var_116_axes_0, x = var_115_cast_fp16)[name = tensor("op_116_cast_fp16")]; tensor q_1_begin_0 = const()[name = tensor("q_1_begin_0"), val = tensor([0, 0, 0, 0])]; tensor q_1_end_0 = const()[name = tensor("q_1_end_0"), val = tensor([1, 50, 1, 768])]; tensor q_1_end_mask_0 = const()[name = tensor("q_1_end_mask_0"), val = tensor([false, true, true, true])]; tensor q_1_squeeze_mask_0 = const()[name = tensor("q_1_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor q_1_cast_fp16 = slice_by_index(begin = q_1_begin_0, end = q_1_end_0, end_mask = q_1_end_mask_0, squeeze_mask = q_1_squeeze_mask_0, x = var_116_cast_fp16)[name = tensor("q_1_cast_fp16")]; tensor k_1_begin_0 = const()[name = tensor("k_1_begin_0"), val = tensor([1, 0, 0, 0])]; tensor k_1_end_0 = const()[name = tensor("k_1_end_0"), val = tensor([2, 50, 1, 768])]; tensor k_1_end_mask_0 = const()[name = tensor("k_1_end_mask_0"), val = tensor([false, true, true, true])]; tensor k_1_squeeze_mask_0 = const()[name = tensor("k_1_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor k_1_cast_fp16 = slice_by_index(begin = k_1_begin_0, end = k_1_end_0, end_mask = k_1_end_mask_0, squeeze_mask = k_1_squeeze_mask_0, x = var_116_cast_fp16)[name = tensor("k_1_cast_fp16")]; tensor v_1_begin_0 = const()[name = tensor("v_1_begin_0"), val = tensor([2, 0, 0, 0])]; tensor v_1_end_0 = const()[name = tensor("v_1_end_0"), val = tensor([3, 50, 1, 768])]; tensor v_1_end_mask_0 = const()[name = tensor("v_1_end_mask_0"), val = tensor([false, true, true, true])]; tensor v_1_squeeze_mask_0 = const()[name = tensor("v_1_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor v_1_cast_fp16 = slice_by_index(begin = v_1_begin_0, end = v_1_end_0, end_mask = v_1_end_mask_0, squeeze_mask = v_1_squeeze_mask_0, x = var_116_cast_fp16)[name = tensor("v_1_cast_fp16")]; tensor var_124 = const()[name = tensor("op_124"), val = tensor([50, 12, 64])]; tensor var_125_cast_fp16 = reshape(shape = var_124, x = q_1_cast_fp16)[name = tensor("op_125_cast_fp16")]; tensor q_3_perm_0 = const()[name = tensor("q_3_perm_0"), val = tensor([1, 0, 2])]; tensor var_131 = const()[name = tensor("op_131"), val = tensor([50, 12, 64])]; tensor var_132_cast_fp16 = reshape(shape = var_131, x = k_1_cast_fp16)[name = tensor("op_132_cast_fp16")]; tensor k_3_perm_0 = const()[name = tensor("k_3_perm_0"), val = tensor([1, 0, 2])]; tensor var_138 = const()[name = tensor("op_138"), val = tensor([50, 12, 64])]; tensor var_139_cast_fp16 = reshape(shape = var_138, x = v_1_cast_fp16)[name = tensor("op_139_cast_fp16")]; tensor v_3_perm_0 = const()[name = tensor("v_3_perm_0"), val = tensor([1, 0, 2])]; tensor var_142 = const()[name = tensor("op_142"), val = tensor([1, 12, 50, 64])]; tensor q_3_cast_fp16 = transpose(perm = q_3_perm_0, x = var_125_cast_fp16)[name = tensor("transpose_82")]; tensor q_5_cast_fp16 = reshape(shape = var_142, x = q_3_cast_fp16)[name = tensor("q_5_cast_fp16")]; tensor var_144 = const()[name = tensor("op_144"), val = tensor([1, 12, 50, 64])]; tensor k_3_cast_fp16 = transpose(perm = k_3_perm_0, x = var_132_cast_fp16)[name = tensor("transpose_81")]; tensor k_5_cast_fp16 = reshape(shape = var_144, x = k_3_cast_fp16)[name = tensor("k_5_cast_fp16")]; tensor var_146 = const()[name = tensor("op_146"), val = tensor([1, 12, 50, 64])]; tensor v_3_cast_fp16 = transpose(perm = v_3_perm_0, x = var_139_cast_fp16)[name = tensor("transpose_80")]; tensor v_5_cast_fp16 = reshape(shape = var_146, x = v_3_cast_fp16)[name = tensor("v_5_cast_fp16")]; tensor mul_1_y_0_to_fp16 = const()[name = tensor("mul_1_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor mul_1_cast_fp16 = mul(x = q_5_cast_fp16, y = mul_1_y_0_to_fp16)[name = tensor("mul_1_cast_fp16")]; tensor matmul_0_transpose_y_0 = const()[name = tensor("matmul_0_transpose_y_0"), val = tensor(true)]; tensor matmul_0_transpose_x_0 = const()[name = tensor("matmul_0_transpose_x_0"), val = tensor(false)]; tensor matmul_0_cast_fp16 = matmul(transpose_x = matmul_0_transpose_x_0, transpose_y = matmul_0_transpose_y_0, x = mul_1_cast_fp16, y = k_5_cast_fp16)[name = tensor("matmul_0_cast_fp16")]; tensor softmax_0_axis_0 = const()[name = tensor("softmax_0_axis_0"), val = tensor(-1)]; tensor softmax_0_cast_fp16 = softmax(axis = softmax_0_axis_0, x = matmul_0_cast_fp16)[name = tensor("softmax_0_cast_fp16")]; tensor attn_output_1_transpose_x_0 = const()[name = tensor("attn_output_1_transpose_x_0"), val = tensor(false)]; tensor attn_output_1_transpose_y_0 = const()[name = tensor("attn_output_1_transpose_y_0"), val = tensor(false)]; tensor attn_output_1_cast_fp16 = matmul(transpose_x = attn_output_1_transpose_x_0, transpose_y = attn_output_1_transpose_y_0, x = softmax_0_cast_fp16, y = v_5_cast_fp16)[name = tensor("attn_output_1_cast_fp16")]; tensor var_149 = const()[name = tensor("op_149"), val = tensor([2, 0, 1, 3])]; tensor var_154 = const()[name = tensor("op_154"), val = tensor([50, 768])]; tensor var_150_cast_fp16 = transpose(perm = var_149, x = attn_output_1_cast_fp16)[name = tensor("transpose_79")]; tensor attn_output_3_cast_fp16 = reshape(shape = var_154, x = var_150_cast_fp16)[name = tensor("attn_output_3_cast_fp16")]; tensor model_visual_transformer_resblocks_0_attn_out_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_0_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8347264)))]; tensor model_visual_transformer_resblocks_0_attn_out_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_0_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9526976)))]; tensor linear_1_cast_fp16 = linear(bias = model_visual_transformer_resblocks_0_attn_out_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_0_attn_out_proj_weight_to_fp16, x = attn_output_3_cast_fp16)[name = tensor("linear_1_cast_fp16")]; tensor var_158 = const()[name = tensor("op_158"), val = tensor([50, 1, 768])]; tensor attn_output_7_cast_fp16 = reshape(shape = var_158, x = linear_1_cast_fp16)[name = tensor("attn_output_7_cast_fp16")]; tensor var_160_perm_0 = const()[name = tensor("op_160_perm_0"), val = tensor([1, 0, 2])]; tensor var_160_cast_fp16 = transpose(perm = var_160_perm_0, x = attn_output_7_cast_fp16)[name = tensor("transpose_78")]; tensor input_5_cast_fp16 = add(x = x_9_cast_fp16, y = var_160_cast_fp16)[name = tensor("input_5_cast_fp16")]; tensor x_13_axes_0 = const()[name = tensor("x_13_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_0_ln_2_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_0_ln_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9528576)))]; tensor model_visual_transformer_resblocks_0_ln_2_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_0_ln_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9530176)))]; tensor x_13_cast_fp16 = layer_norm(axes = x_13_axes_0, beta = model_visual_transformer_resblocks_0_ln_2_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_0_ln_2_weight_to_fp16, x = input_5_cast_fp16)[name = tensor("x_13_cast_fp16")]; tensor model_visual_transformer_resblocks_0_mlp_c_fc_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_0_mlp_c_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9531776)))]; tensor model_visual_transformer_resblocks_0_mlp_c_fc_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_0_mlp_c_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14250432)))]; tensor linear_2_cast_fp16 = linear(bias = model_visual_transformer_resblocks_0_mlp_c_fc_bias_to_fp16, weight = model_visual_transformer_resblocks_0_mlp_c_fc_weight_to_fp16, x = x_13_cast_fp16)[name = tensor("linear_2_cast_fp16")]; tensor input_11_mode_0 = const()[name = tensor("input_11_mode_0"), val = tensor("EXACT")]; tensor input_11_cast_fp16 = gelu(mode = input_11_mode_0, x = linear_2_cast_fp16)[name = tensor("input_11_cast_fp16")]; tensor model_visual_transformer_resblocks_0_mlp_c_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_0_mlp_c_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14256640)))]; tensor model_visual_transformer_resblocks_0_mlp_c_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_0_mlp_c_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18975296)))]; tensor linear_3_cast_fp16 = linear(bias = model_visual_transformer_resblocks_0_mlp_c_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_0_mlp_c_proj_weight_to_fp16, x = input_11_cast_fp16)[name = tensor("linear_3_cast_fp16")]; tensor input_13_cast_fp16 = add(x = input_5_cast_fp16, y = linear_3_cast_fp16)[name = tensor("input_13_cast_fp16")]; tensor x_15_axes_0 = const()[name = tensor("x_15_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_1_ln_1_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_1_ln_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18976896)))]; tensor model_visual_transformer_resblocks_1_ln_1_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_1_ln_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18978496)))]; tensor x_15_cast_fp16 = layer_norm(axes = x_15_axes_0, beta = model_visual_transformer_resblocks_1_ln_1_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_1_ln_1_weight_to_fp16, x = input_13_cast_fp16)[name = tensor("x_15_cast_fp16")]; tensor query_7_perm_0 = const()[name = tensor("query_7_perm_0"), val = tensor([1, 0, 2])]; tensor model_visual_transformer_resblocks_1_attn_in_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_1_attn_in_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18980096)))]; tensor model_visual_transformer_resblocks_1_attn_in_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_1_attn_in_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22519104)))]; tensor query_7_cast_fp16 = transpose(perm = query_7_perm_0, x = x_15_cast_fp16)[name = tensor("transpose_77")]; tensor linear_4_cast_fp16 = linear(bias = model_visual_transformer_resblocks_1_attn_in_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_1_attn_in_proj_weight_to_fp16, x = query_7_cast_fp16)[name = tensor("linear_4_cast_fp16")]; tensor concat_2 = const()[name = tensor("concat_2"), val = tensor([50, 1, 3, 768])]; tensor var_209_cast_fp16 = reshape(shape = concat_2, x = linear_4_cast_fp16)[name = tensor("op_209_cast_fp16")]; tensor var_210_axes_0 = const()[name = tensor("op_210_axes_0"), val = tensor([0])]; tensor var_210_cast_fp16 = expand_dims(axes = var_210_axes_0, x = var_209_cast_fp16)[name = tensor("op_210_cast_fp16")]; tensor var_211_perm_0 = const()[name = tensor("op_211_perm_0"), val = tensor([-2, 1, 2, 0, 4])]; tensor var_212_axes_0 = const()[name = tensor("op_212_axes_0"), val = tensor([-2])]; tensor var_211_cast_fp16 = transpose(perm = var_211_perm_0, x = var_210_cast_fp16)[name = tensor("transpose_76")]; tensor var_212_cast_fp16 = squeeze(axes = var_212_axes_0, x = var_211_cast_fp16)[name = tensor("op_212_cast_fp16")]; tensor q_7_begin_0 = const()[name = tensor("q_7_begin_0"), val = tensor([0, 0, 0, 0])]; tensor q_7_end_0 = const()[name = tensor("q_7_end_0"), val = tensor([1, 50, 1, 768])]; tensor q_7_end_mask_0 = const()[name = tensor("q_7_end_mask_0"), val = tensor([false, true, true, true])]; tensor q_7_squeeze_mask_0 = const()[name = tensor("q_7_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor q_7_cast_fp16 = slice_by_index(begin = q_7_begin_0, end = q_7_end_0, end_mask = q_7_end_mask_0, squeeze_mask = q_7_squeeze_mask_0, x = var_212_cast_fp16)[name = tensor("q_7_cast_fp16")]; tensor k_7_begin_0 = const()[name = tensor("k_7_begin_0"), val = tensor([1, 0, 0, 0])]; tensor k_7_end_0 = const()[name = tensor("k_7_end_0"), val = tensor([2, 50, 1, 768])]; tensor k_7_end_mask_0 = const()[name = tensor("k_7_end_mask_0"), val = tensor([false, true, true, true])]; tensor k_7_squeeze_mask_0 = const()[name = tensor("k_7_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor k_7_cast_fp16 = slice_by_index(begin = k_7_begin_0, end = k_7_end_0, end_mask = k_7_end_mask_0, squeeze_mask = k_7_squeeze_mask_0, x = var_212_cast_fp16)[name = tensor("k_7_cast_fp16")]; tensor v_7_begin_0 = const()[name = tensor("v_7_begin_0"), val = tensor([2, 0, 0, 0])]; tensor v_7_end_0 = const()[name = tensor("v_7_end_0"), val = tensor([3, 50, 1, 768])]; tensor v_7_end_mask_0 = const()[name = tensor("v_7_end_mask_0"), val = tensor([false, true, true, true])]; tensor v_7_squeeze_mask_0 = const()[name = tensor("v_7_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor v_7_cast_fp16 = slice_by_index(begin = v_7_begin_0, end = v_7_end_0, end_mask = v_7_end_mask_0, squeeze_mask = v_7_squeeze_mask_0, x = var_212_cast_fp16)[name = tensor("v_7_cast_fp16")]; tensor var_220 = const()[name = tensor("op_220"), val = tensor([50, 12, 64])]; tensor var_221_cast_fp16 = reshape(shape = var_220, x = q_7_cast_fp16)[name = tensor("op_221_cast_fp16")]; tensor q_9_perm_0 = const()[name = tensor("q_9_perm_0"), val = tensor([1, 0, 2])]; tensor var_227 = const()[name = tensor("op_227"), val = tensor([50, 12, 64])]; tensor var_228_cast_fp16 = reshape(shape = var_227, x = k_7_cast_fp16)[name = tensor("op_228_cast_fp16")]; tensor k_9_perm_0 = const()[name = tensor("k_9_perm_0"), val = tensor([1, 0, 2])]; tensor var_234 = const()[name = tensor("op_234"), val = tensor([50, 12, 64])]; tensor var_235_cast_fp16 = reshape(shape = var_234, x = v_7_cast_fp16)[name = tensor("op_235_cast_fp16")]; tensor v_9_perm_0 = const()[name = tensor("v_9_perm_0"), val = tensor([1, 0, 2])]; tensor var_238 = const()[name = tensor("op_238"), val = tensor([1, 12, 50, 64])]; tensor q_9_cast_fp16 = transpose(perm = q_9_perm_0, x = var_221_cast_fp16)[name = tensor("transpose_75")]; tensor q_11_cast_fp16 = reshape(shape = var_238, x = q_9_cast_fp16)[name = tensor("q_11_cast_fp16")]; tensor var_240 = const()[name = tensor("op_240"), val = tensor([1, 12, 50, 64])]; tensor k_9_cast_fp16 = transpose(perm = k_9_perm_0, x = var_228_cast_fp16)[name = tensor("transpose_74")]; tensor k_11_cast_fp16 = reshape(shape = var_240, x = k_9_cast_fp16)[name = tensor("k_11_cast_fp16")]; tensor var_242 = const()[name = tensor("op_242"), val = tensor([1, 12, 50, 64])]; tensor v_9_cast_fp16 = transpose(perm = v_9_perm_0, x = var_235_cast_fp16)[name = tensor("transpose_73")]; tensor v_11_cast_fp16 = reshape(shape = var_242, x = v_9_cast_fp16)[name = tensor("v_11_cast_fp16")]; tensor mul_3_y_0_to_fp16 = const()[name = tensor("mul_3_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor mul_3_cast_fp16 = mul(x = q_11_cast_fp16, y = mul_3_y_0_to_fp16)[name = tensor("mul_3_cast_fp16")]; tensor matmul_1_transpose_y_0 = const()[name = tensor("matmul_1_transpose_y_0"), val = tensor(true)]; tensor matmul_1_transpose_x_0 = const()[name = tensor("matmul_1_transpose_x_0"), val = tensor(false)]; tensor matmul_1_cast_fp16 = matmul(transpose_x = matmul_1_transpose_x_0, transpose_y = matmul_1_transpose_y_0, x = mul_3_cast_fp16, y = k_11_cast_fp16)[name = tensor("matmul_1_cast_fp16")]; tensor softmax_1_axis_0 = const()[name = tensor("softmax_1_axis_0"), val = tensor(-1)]; tensor softmax_1_cast_fp16 = softmax(axis = softmax_1_axis_0, x = matmul_1_cast_fp16)[name = tensor("softmax_1_cast_fp16")]; tensor attn_output_9_transpose_x_0 = const()[name = tensor("attn_output_9_transpose_x_0"), val = tensor(false)]; tensor attn_output_9_transpose_y_0 = const()[name = tensor("attn_output_9_transpose_y_0"), val = tensor(false)]; tensor attn_output_9_cast_fp16 = matmul(transpose_x = attn_output_9_transpose_x_0, transpose_y = attn_output_9_transpose_y_0, x = softmax_1_cast_fp16, y = v_11_cast_fp16)[name = tensor("attn_output_9_cast_fp16")]; tensor var_245 = const()[name = tensor("op_245"), val = tensor([2, 0, 1, 3])]; tensor var_250 = const()[name = tensor("op_250"), val = tensor([50, 768])]; tensor var_246_cast_fp16 = transpose(perm = var_245, x = attn_output_9_cast_fp16)[name = tensor("transpose_72")]; tensor attn_output_11_cast_fp16 = reshape(shape = var_250, x = var_246_cast_fp16)[name = tensor("attn_output_11_cast_fp16")]; tensor model_visual_transformer_resblocks_1_attn_out_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_1_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22523776)))]; tensor model_visual_transformer_resblocks_1_attn_out_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_1_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23703488)))]; tensor linear_5_cast_fp16 = linear(bias = model_visual_transformer_resblocks_1_attn_out_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_1_attn_out_proj_weight_to_fp16, x = attn_output_11_cast_fp16)[name = tensor("linear_5_cast_fp16")]; tensor var_254 = const()[name = tensor("op_254"), val = tensor([50, 1, 768])]; tensor attn_output_15_cast_fp16 = reshape(shape = var_254, x = linear_5_cast_fp16)[name = tensor("attn_output_15_cast_fp16")]; tensor var_256_perm_0 = const()[name = tensor("op_256_perm_0"), val = tensor([1, 0, 2])]; tensor var_256_cast_fp16 = transpose(perm = var_256_perm_0, x = attn_output_15_cast_fp16)[name = tensor("transpose_71")]; tensor input_15_cast_fp16 = add(x = input_13_cast_fp16, y = var_256_cast_fp16)[name = tensor("input_15_cast_fp16")]; tensor x_17_axes_0 = const()[name = tensor("x_17_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_1_ln_2_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_1_ln_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23705088)))]; tensor model_visual_transformer_resblocks_1_ln_2_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_1_ln_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23706688)))]; tensor x_17_cast_fp16 = layer_norm(axes = x_17_axes_0, beta = model_visual_transformer_resblocks_1_ln_2_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_1_ln_2_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("x_17_cast_fp16")]; tensor model_visual_transformer_resblocks_1_mlp_c_fc_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_1_mlp_c_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23708288)))]; tensor model_visual_transformer_resblocks_1_mlp_c_fc_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_1_mlp_c_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28426944)))]; tensor linear_6_cast_fp16 = linear(bias = model_visual_transformer_resblocks_1_mlp_c_fc_bias_to_fp16, weight = model_visual_transformer_resblocks_1_mlp_c_fc_weight_to_fp16, x = x_17_cast_fp16)[name = tensor("linear_6_cast_fp16")]; tensor input_21_mode_0 = const()[name = tensor("input_21_mode_0"), val = tensor("EXACT")]; tensor input_21_cast_fp16 = gelu(mode = input_21_mode_0, x = linear_6_cast_fp16)[name = tensor("input_21_cast_fp16")]; tensor model_visual_transformer_resblocks_1_mlp_c_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_1_mlp_c_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28433152)))]; tensor model_visual_transformer_resblocks_1_mlp_c_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_1_mlp_c_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33151808)))]; tensor linear_7_cast_fp16 = linear(bias = model_visual_transformer_resblocks_1_mlp_c_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_1_mlp_c_proj_weight_to_fp16, x = input_21_cast_fp16)[name = tensor("linear_7_cast_fp16")]; tensor input_23_cast_fp16 = add(x = input_15_cast_fp16, y = linear_7_cast_fp16)[name = tensor("input_23_cast_fp16")]; tensor x_19_axes_0 = const()[name = tensor("x_19_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_2_ln_1_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_2_ln_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33153408)))]; tensor model_visual_transformer_resblocks_2_ln_1_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_2_ln_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33155008)))]; tensor x_19_cast_fp16 = layer_norm(axes = x_19_axes_0, beta = model_visual_transformer_resblocks_2_ln_1_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_2_ln_1_weight_to_fp16, x = input_23_cast_fp16)[name = tensor("x_19_cast_fp16")]; tensor query_11_perm_0 = const()[name = tensor("query_11_perm_0"), val = tensor([1, 0, 2])]; tensor model_visual_transformer_resblocks_2_attn_in_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_2_attn_in_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33156608)))]; tensor model_visual_transformer_resblocks_2_attn_in_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_2_attn_in_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36695616)))]; tensor query_11_cast_fp16 = transpose(perm = query_11_perm_0, x = x_19_cast_fp16)[name = tensor("transpose_70")]; tensor linear_8_cast_fp16 = linear(bias = model_visual_transformer_resblocks_2_attn_in_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_2_attn_in_proj_weight_to_fp16, x = query_11_cast_fp16)[name = tensor("linear_8_cast_fp16")]; tensor concat_3 = const()[name = tensor("concat_3"), val = tensor([50, 1, 3, 768])]; tensor var_305_cast_fp16 = reshape(shape = concat_3, x = linear_8_cast_fp16)[name = tensor("op_305_cast_fp16")]; tensor var_306_axes_0 = const()[name = tensor("op_306_axes_0"), val = tensor([0])]; tensor var_306_cast_fp16 = expand_dims(axes = var_306_axes_0, x = var_305_cast_fp16)[name = tensor("op_306_cast_fp16")]; tensor var_307_perm_0 = const()[name = tensor("op_307_perm_0"), val = tensor([-2, 1, 2, 0, 4])]; tensor var_308_axes_0 = const()[name = tensor("op_308_axes_0"), val = tensor([-2])]; tensor var_307_cast_fp16 = transpose(perm = var_307_perm_0, x = var_306_cast_fp16)[name = tensor("transpose_69")]; tensor var_308_cast_fp16 = squeeze(axes = var_308_axes_0, x = var_307_cast_fp16)[name = tensor("op_308_cast_fp16")]; tensor q_13_begin_0 = const()[name = tensor("q_13_begin_0"), val = tensor([0, 0, 0, 0])]; tensor q_13_end_0 = const()[name = tensor("q_13_end_0"), val = tensor([1, 50, 1, 768])]; tensor q_13_end_mask_0 = const()[name = tensor("q_13_end_mask_0"), val = tensor([false, true, true, true])]; tensor q_13_squeeze_mask_0 = const()[name = tensor("q_13_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor q_13_cast_fp16 = slice_by_index(begin = q_13_begin_0, end = q_13_end_0, end_mask = q_13_end_mask_0, squeeze_mask = q_13_squeeze_mask_0, x = var_308_cast_fp16)[name = tensor("q_13_cast_fp16")]; tensor k_13_begin_0 = const()[name = tensor("k_13_begin_0"), val = tensor([1, 0, 0, 0])]; tensor k_13_end_0 = const()[name = tensor("k_13_end_0"), val = tensor([2, 50, 1, 768])]; tensor k_13_end_mask_0 = const()[name = tensor("k_13_end_mask_0"), val = tensor([false, true, true, true])]; tensor k_13_squeeze_mask_0 = const()[name = tensor("k_13_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor k_13_cast_fp16 = slice_by_index(begin = k_13_begin_0, end = k_13_end_0, end_mask = k_13_end_mask_0, squeeze_mask = k_13_squeeze_mask_0, x = var_308_cast_fp16)[name = tensor("k_13_cast_fp16")]; tensor v_13_begin_0 = const()[name = tensor("v_13_begin_0"), val = tensor([2, 0, 0, 0])]; tensor v_13_end_0 = const()[name = tensor("v_13_end_0"), val = tensor([3, 50, 1, 768])]; tensor v_13_end_mask_0 = const()[name = tensor("v_13_end_mask_0"), val = tensor([false, true, true, true])]; tensor v_13_squeeze_mask_0 = const()[name = tensor("v_13_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor v_13_cast_fp16 = slice_by_index(begin = v_13_begin_0, end = v_13_end_0, end_mask = v_13_end_mask_0, squeeze_mask = v_13_squeeze_mask_0, x = var_308_cast_fp16)[name = tensor("v_13_cast_fp16")]; tensor var_316 = const()[name = tensor("op_316"), val = tensor([50, 12, 64])]; tensor var_317_cast_fp16 = reshape(shape = var_316, x = q_13_cast_fp16)[name = tensor("op_317_cast_fp16")]; tensor q_15_perm_0 = const()[name = tensor("q_15_perm_0"), val = tensor([1, 0, 2])]; tensor var_323 = const()[name = tensor("op_323"), val = tensor([50, 12, 64])]; tensor var_324_cast_fp16 = reshape(shape = var_323, x = k_13_cast_fp16)[name = tensor("op_324_cast_fp16")]; tensor k_15_perm_0 = const()[name = tensor("k_15_perm_0"), val = tensor([1, 0, 2])]; tensor var_330 = const()[name = tensor("op_330"), val = tensor([50, 12, 64])]; tensor var_331_cast_fp16 = reshape(shape = var_330, x = v_13_cast_fp16)[name = tensor("op_331_cast_fp16")]; tensor v_15_perm_0 = const()[name = tensor("v_15_perm_0"), val = tensor([1, 0, 2])]; tensor var_334 = const()[name = tensor("op_334"), val = tensor([1, 12, 50, 64])]; tensor q_15_cast_fp16 = transpose(perm = q_15_perm_0, x = var_317_cast_fp16)[name = tensor("transpose_68")]; tensor q_17_cast_fp16 = reshape(shape = var_334, x = q_15_cast_fp16)[name = tensor("q_17_cast_fp16")]; tensor var_336 = const()[name = tensor("op_336"), val = tensor([1, 12, 50, 64])]; tensor k_15_cast_fp16 = transpose(perm = k_15_perm_0, x = var_324_cast_fp16)[name = tensor("transpose_67")]; tensor k_17_cast_fp16 = reshape(shape = var_336, x = k_15_cast_fp16)[name = tensor("k_17_cast_fp16")]; tensor var_338 = const()[name = tensor("op_338"), val = tensor([1, 12, 50, 64])]; tensor v_15_cast_fp16 = transpose(perm = v_15_perm_0, x = var_331_cast_fp16)[name = tensor("transpose_66")]; tensor v_17_cast_fp16 = reshape(shape = var_338, x = v_15_cast_fp16)[name = tensor("v_17_cast_fp16")]; tensor mul_5_y_0_to_fp16 = const()[name = tensor("mul_5_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor mul_5_cast_fp16 = mul(x = q_17_cast_fp16, y = mul_5_y_0_to_fp16)[name = tensor("mul_5_cast_fp16")]; tensor matmul_2_transpose_y_0 = const()[name = tensor("matmul_2_transpose_y_0"), val = tensor(true)]; tensor matmul_2_transpose_x_0 = const()[name = tensor("matmul_2_transpose_x_0"), val = tensor(false)]; tensor matmul_2_cast_fp16 = matmul(transpose_x = matmul_2_transpose_x_0, transpose_y = matmul_2_transpose_y_0, x = mul_5_cast_fp16, y = k_17_cast_fp16)[name = tensor("matmul_2_cast_fp16")]; tensor softmax_2_axis_0 = const()[name = tensor("softmax_2_axis_0"), val = tensor(-1)]; tensor softmax_2_cast_fp16 = softmax(axis = softmax_2_axis_0, x = matmul_2_cast_fp16)[name = tensor("softmax_2_cast_fp16")]; tensor attn_output_17_transpose_x_0 = const()[name = tensor("attn_output_17_transpose_x_0"), val = tensor(false)]; tensor attn_output_17_transpose_y_0 = const()[name = tensor("attn_output_17_transpose_y_0"), val = tensor(false)]; tensor attn_output_17_cast_fp16 = matmul(transpose_x = attn_output_17_transpose_x_0, transpose_y = attn_output_17_transpose_y_0, x = softmax_2_cast_fp16, y = v_17_cast_fp16)[name = tensor("attn_output_17_cast_fp16")]; tensor var_341 = const()[name = tensor("op_341"), val = tensor([2, 0, 1, 3])]; tensor var_346 = const()[name = tensor("op_346"), val = tensor([50, 768])]; tensor var_342_cast_fp16 = transpose(perm = var_341, x = attn_output_17_cast_fp16)[name = tensor("transpose_65")]; tensor attn_output_19_cast_fp16 = reshape(shape = var_346, x = var_342_cast_fp16)[name = tensor("attn_output_19_cast_fp16")]; tensor model_visual_transformer_resblocks_2_attn_out_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_2_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36700288)))]; tensor model_visual_transformer_resblocks_2_attn_out_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_2_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37880000)))]; tensor linear_9_cast_fp16 = linear(bias = model_visual_transformer_resblocks_2_attn_out_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_2_attn_out_proj_weight_to_fp16, x = attn_output_19_cast_fp16)[name = tensor("linear_9_cast_fp16")]; tensor var_350 = const()[name = tensor("op_350"), val = tensor([50, 1, 768])]; tensor attn_output_23_cast_fp16 = reshape(shape = var_350, x = linear_9_cast_fp16)[name = tensor("attn_output_23_cast_fp16")]; tensor var_352_perm_0 = const()[name = tensor("op_352_perm_0"), val = tensor([1, 0, 2])]; tensor var_352_cast_fp16 = transpose(perm = var_352_perm_0, x = attn_output_23_cast_fp16)[name = tensor("transpose_64")]; tensor input_25_cast_fp16 = add(x = input_23_cast_fp16, y = var_352_cast_fp16)[name = tensor("input_25_cast_fp16")]; tensor x_21_axes_0 = const()[name = tensor("x_21_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_2_ln_2_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_2_ln_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37881600)))]; tensor model_visual_transformer_resblocks_2_ln_2_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_2_ln_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37883200)))]; tensor x_21_cast_fp16 = layer_norm(axes = x_21_axes_0, beta = model_visual_transformer_resblocks_2_ln_2_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_2_ln_2_weight_to_fp16, x = input_25_cast_fp16)[name = tensor("x_21_cast_fp16")]; tensor model_visual_transformer_resblocks_2_mlp_c_fc_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_2_mlp_c_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37884800)))]; tensor model_visual_transformer_resblocks_2_mlp_c_fc_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_2_mlp_c_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(42603456)))]; tensor linear_10_cast_fp16 = linear(bias = model_visual_transformer_resblocks_2_mlp_c_fc_bias_to_fp16, weight = model_visual_transformer_resblocks_2_mlp_c_fc_weight_to_fp16, x = x_21_cast_fp16)[name = tensor("linear_10_cast_fp16")]; tensor input_31_mode_0 = const()[name = tensor("input_31_mode_0"), val = tensor("EXACT")]; tensor input_31_cast_fp16 = gelu(mode = input_31_mode_0, x = linear_10_cast_fp16)[name = tensor("input_31_cast_fp16")]; tensor model_visual_transformer_resblocks_2_mlp_c_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_2_mlp_c_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(42609664)))]; tensor model_visual_transformer_resblocks_2_mlp_c_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_2_mlp_c_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47328320)))]; tensor linear_11_cast_fp16 = linear(bias = model_visual_transformer_resblocks_2_mlp_c_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_2_mlp_c_proj_weight_to_fp16, x = input_31_cast_fp16)[name = tensor("linear_11_cast_fp16")]; tensor input_33_cast_fp16 = add(x = input_25_cast_fp16, y = linear_11_cast_fp16)[name = tensor("input_33_cast_fp16")]; tensor x_23_axes_0 = const()[name = tensor("x_23_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_3_ln_1_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_3_ln_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47329920)))]; tensor model_visual_transformer_resblocks_3_ln_1_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_3_ln_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47331520)))]; tensor x_23_cast_fp16 = layer_norm(axes = x_23_axes_0, beta = model_visual_transformer_resblocks_3_ln_1_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_3_ln_1_weight_to_fp16, x = input_33_cast_fp16)[name = tensor("x_23_cast_fp16")]; tensor query_15_perm_0 = const()[name = tensor("query_15_perm_0"), val = tensor([1, 0, 2])]; tensor model_visual_transformer_resblocks_3_attn_in_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_3_attn_in_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47333120)))]; tensor model_visual_transformer_resblocks_3_attn_in_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_3_attn_in_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50872128)))]; tensor query_15_cast_fp16 = transpose(perm = query_15_perm_0, x = x_23_cast_fp16)[name = tensor("transpose_63")]; tensor linear_12_cast_fp16 = linear(bias = model_visual_transformer_resblocks_3_attn_in_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_3_attn_in_proj_weight_to_fp16, x = query_15_cast_fp16)[name = tensor("linear_12_cast_fp16")]; tensor concat_4 = const()[name = tensor("concat_4"), val = tensor([50, 1, 3, 768])]; tensor var_401_cast_fp16 = reshape(shape = concat_4, x = linear_12_cast_fp16)[name = tensor("op_401_cast_fp16")]; tensor var_402_axes_0 = const()[name = tensor("op_402_axes_0"), val = tensor([0])]; tensor var_402_cast_fp16 = expand_dims(axes = var_402_axes_0, x = var_401_cast_fp16)[name = tensor("op_402_cast_fp16")]; tensor var_403_perm_0 = const()[name = tensor("op_403_perm_0"), val = tensor([-2, 1, 2, 0, 4])]; tensor var_404_axes_0 = const()[name = tensor("op_404_axes_0"), val = tensor([-2])]; tensor var_403_cast_fp16 = transpose(perm = var_403_perm_0, x = var_402_cast_fp16)[name = tensor("transpose_62")]; tensor var_404_cast_fp16 = squeeze(axes = var_404_axes_0, x = var_403_cast_fp16)[name = tensor("op_404_cast_fp16")]; tensor q_19_begin_0 = const()[name = tensor("q_19_begin_0"), val = tensor([0, 0, 0, 0])]; tensor q_19_end_0 = const()[name = tensor("q_19_end_0"), val = tensor([1, 50, 1, 768])]; tensor q_19_end_mask_0 = const()[name = tensor("q_19_end_mask_0"), val = tensor([false, true, true, true])]; tensor q_19_squeeze_mask_0 = const()[name = tensor("q_19_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor q_19_cast_fp16 = slice_by_index(begin = q_19_begin_0, end = q_19_end_0, end_mask = q_19_end_mask_0, squeeze_mask = q_19_squeeze_mask_0, x = var_404_cast_fp16)[name = tensor("q_19_cast_fp16")]; tensor k_19_begin_0 = const()[name = tensor("k_19_begin_0"), val = tensor([1, 0, 0, 0])]; tensor k_19_end_0 = const()[name = tensor("k_19_end_0"), val = tensor([2, 50, 1, 768])]; tensor k_19_end_mask_0 = const()[name = tensor("k_19_end_mask_0"), val = tensor([false, true, true, true])]; tensor k_19_squeeze_mask_0 = const()[name = tensor("k_19_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor k_19_cast_fp16 = slice_by_index(begin = k_19_begin_0, end = k_19_end_0, end_mask = k_19_end_mask_0, squeeze_mask = k_19_squeeze_mask_0, x = var_404_cast_fp16)[name = tensor("k_19_cast_fp16")]; tensor v_19_begin_0 = const()[name = tensor("v_19_begin_0"), val = tensor([2, 0, 0, 0])]; tensor v_19_end_0 = const()[name = tensor("v_19_end_0"), val = tensor([3, 50, 1, 768])]; tensor v_19_end_mask_0 = const()[name = tensor("v_19_end_mask_0"), val = tensor([false, true, true, true])]; tensor v_19_squeeze_mask_0 = const()[name = tensor("v_19_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor v_19_cast_fp16 = slice_by_index(begin = v_19_begin_0, end = v_19_end_0, end_mask = v_19_end_mask_0, squeeze_mask = v_19_squeeze_mask_0, x = var_404_cast_fp16)[name = tensor("v_19_cast_fp16")]; tensor var_412 = const()[name = tensor("op_412"), val = tensor([50, 12, 64])]; tensor var_413_cast_fp16 = reshape(shape = var_412, x = q_19_cast_fp16)[name = tensor("op_413_cast_fp16")]; tensor q_21_perm_0 = const()[name = tensor("q_21_perm_0"), val = tensor([1, 0, 2])]; tensor var_419 = const()[name = tensor("op_419"), val = tensor([50, 12, 64])]; tensor var_420_cast_fp16 = reshape(shape = var_419, x = k_19_cast_fp16)[name = tensor("op_420_cast_fp16")]; tensor k_21_perm_0 = const()[name = tensor("k_21_perm_0"), val = tensor([1, 0, 2])]; tensor var_426 = const()[name = tensor("op_426"), val = tensor([50, 12, 64])]; tensor var_427_cast_fp16 = reshape(shape = var_426, x = v_19_cast_fp16)[name = tensor("op_427_cast_fp16")]; tensor v_21_perm_0 = const()[name = tensor("v_21_perm_0"), val = tensor([1, 0, 2])]; tensor var_430 = const()[name = tensor("op_430"), val = tensor([1, 12, 50, 64])]; tensor q_21_cast_fp16 = transpose(perm = q_21_perm_0, x = var_413_cast_fp16)[name = tensor("transpose_61")]; tensor q_23_cast_fp16 = reshape(shape = var_430, x = q_21_cast_fp16)[name = tensor("q_23_cast_fp16")]; tensor var_432 = const()[name = tensor("op_432"), val = tensor([1, 12, 50, 64])]; tensor k_21_cast_fp16 = transpose(perm = k_21_perm_0, x = var_420_cast_fp16)[name = tensor("transpose_60")]; tensor k_23_cast_fp16 = reshape(shape = var_432, x = k_21_cast_fp16)[name = tensor("k_23_cast_fp16")]; tensor var_434 = const()[name = tensor("op_434"), val = tensor([1, 12, 50, 64])]; tensor v_21_cast_fp16 = transpose(perm = v_21_perm_0, x = var_427_cast_fp16)[name = tensor("transpose_59")]; tensor v_23_cast_fp16 = reshape(shape = var_434, x = v_21_cast_fp16)[name = tensor("v_23_cast_fp16")]; tensor mul_7_y_0_to_fp16 = const()[name = tensor("mul_7_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor mul_7_cast_fp16 = mul(x = q_23_cast_fp16, y = mul_7_y_0_to_fp16)[name = tensor("mul_7_cast_fp16")]; tensor matmul_3_transpose_y_0 = const()[name = tensor("matmul_3_transpose_y_0"), val = tensor(true)]; tensor matmul_3_transpose_x_0 = const()[name = tensor("matmul_3_transpose_x_0"), val = tensor(false)]; tensor matmul_3_cast_fp16 = matmul(transpose_x = matmul_3_transpose_x_0, transpose_y = matmul_3_transpose_y_0, x = mul_7_cast_fp16, y = k_23_cast_fp16)[name = tensor("matmul_3_cast_fp16")]; tensor softmax_3_axis_0 = const()[name = tensor("softmax_3_axis_0"), val = tensor(-1)]; tensor softmax_3_cast_fp16 = softmax(axis = softmax_3_axis_0, x = matmul_3_cast_fp16)[name = tensor("softmax_3_cast_fp16")]; tensor attn_output_25_transpose_x_0 = const()[name = tensor("attn_output_25_transpose_x_0"), val = tensor(false)]; tensor attn_output_25_transpose_y_0 = const()[name = tensor("attn_output_25_transpose_y_0"), val = tensor(false)]; tensor attn_output_25_cast_fp16 = matmul(transpose_x = attn_output_25_transpose_x_0, transpose_y = attn_output_25_transpose_y_0, x = softmax_3_cast_fp16, y = v_23_cast_fp16)[name = tensor("attn_output_25_cast_fp16")]; tensor var_437 = const()[name = tensor("op_437"), val = tensor([2, 0, 1, 3])]; tensor var_442 = const()[name = tensor("op_442"), val = tensor([50, 768])]; tensor var_438_cast_fp16 = transpose(perm = var_437, x = attn_output_25_cast_fp16)[name = tensor("transpose_58")]; tensor attn_output_27_cast_fp16 = reshape(shape = var_442, x = var_438_cast_fp16)[name = tensor("attn_output_27_cast_fp16")]; tensor model_visual_transformer_resblocks_3_attn_out_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_3_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50876800)))]; tensor model_visual_transformer_resblocks_3_attn_out_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_3_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(52056512)))]; tensor linear_13_cast_fp16 = linear(bias = model_visual_transformer_resblocks_3_attn_out_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_3_attn_out_proj_weight_to_fp16, x = attn_output_27_cast_fp16)[name = tensor("linear_13_cast_fp16")]; tensor var_446 = const()[name = tensor("op_446"), val = tensor([50, 1, 768])]; tensor attn_output_31_cast_fp16 = reshape(shape = var_446, x = linear_13_cast_fp16)[name = tensor("attn_output_31_cast_fp16")]; tensor var_448_perm_0 = const()[name = tensor("op_448_perm_0"), val = tensor([1, 0, 2])]; tensor var_448_cast_fp16 = transpose(perm = var_448_perm_0, x = attn_output_31_cast_fp16)[name = tensor("transpose_57")]; tensor input_35_cast_fp16 = add(x = input_33_cast_fp16, y = var_448_cast_fp16)[name = tensor("input_35_cast_fp16")]; tensor x_25_axes_0 = const()[name = tensor("x_25_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_3_ln_2_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_3_ln_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(52058112)))]; tensor model_visual_transformer_resblocks_3_ln_2_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_3_ln_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(52059712)))]; tensor x_25_cast_fp16 = layer_norm(axes = x_25_axes_0, beta = model_visual_transformer_resblocks_3_ln_2_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_3_ln_2_weight_to_fp16, x = input_35_cast_fp16)[name = tensor("x_25_cast_fp16")]; tensor model_visual_transformer_resblocks_3_mlp_c_fc_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_3_mlp_c_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(52061312)))]; tensor model_visual_transformer_resblocks_3_mlp_c_fc_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_3_mlp_c_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(56779968)))]; tensor linear_14_cast_fp16 = linear(bias = model_visual_transformer_resblocks_3_mlp_c_fc_bias_to_fp16, weight = model_visual_transformer_resblocks_3_mlp_c_fc_weight_to_fp16, x = x_25_cast_fp16)[name = tensor("linear_14_cast_fp16")]; tensor input_41_mode_0 = const()[name = tensor("input_41_mode_0"), val = tensor("EXACT")]; tensor input_41_cast_fp16 = gelu(mode = input_41_mode_0, x = linear_14_cast_fp16)[name = tensor("input_41_cast_fp16")]; tensor model_visual_transformer_resblocks_3_mlp_c_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_3_mlp_c_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(56786176)))]; tensor model_visual_transformer_resblocks_3_mlp_c_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_3_mlp_c_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61504832)))]; tensor linear_15_cast_fp16 = linear(bias = model_visual_transformer_resblocks_3_mlp_c_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_3_mlp_c_proj_weight_to_fp16, x = input_41_cast_fp16)[name = tensor("linear_15_cast_fp16")]; tensor input_43_cast_fp16 = add(x = input_35_cast_fp16, y = linear_15_cast_fp16)[name = tensor("input_43_cast_fp16")]; tensor x_27_axes_0 = const()[name = tensor("x_27_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_4_ln_1_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_4_ln_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61506432)))]; tensor model_visual_transformer_resblocks_4_ln_1_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_4_ln_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61508032)))]; tensor x_27_cast_fp16 = layer_norm(axes = x_27_axes_0, beta = model_visual_transformer_resblocks_4_ln_1_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_4_ln_1_weight_to_fp16, x = input_43_cast_fp16)[name = tensor("x_27_cast_fp16")]; tensor query_19_perm_0 = const()[name = tensor("query_19_perm_0"), val = tensor([1, 0, 2])]; tensor model_visual_transformer_resblocks_4_attn_in_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_4_attn_in_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61509632)))]; tensor model_visual_transformer_resblocks_4_attn_in_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_4_attn_in_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65048640)))]; tensor query_19_cast_fp16 = transpose(perm = query_19_perm_0, x = x_27_cast_fp16)[name = tensor("transpose_56")]; tensor linear_16_cast_fp16 = linear(bias = model_visual_transformer_resblocks_4_attn_in_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_4_attn_in_proj_weight_to_fp16, x = query_19_cast_fp16)[name = tensor("linear_16_cast_fp16")]; tensor concat_5 = const()[name = tensor("concat_5"), val = tensor([50, 1, 3, 768])]; tensor var_497_cast_fp16 = reshape(shape = concat_5, x = linear_16_cast_fp16)[name = tensor("op_497_cast_fp16")]; tensor var_498_axes_0 = const()[name = tensor("op_498_axes_0"), val = tensor([0])]; tensor var_498_cast_fp16 = expand_dims(axes = var_498_axes_0, x = var_497_cast_fp16)[name = tensor("op_498_cast_fp16")]; tensor var_499_perm_0 = const()[name = tensor("op_499_perm_0"), val = tensor([-2, 1, 2, 0, 4])]; tensor var_500_axes_0 = const()[name = tensor("op_500_axes_0"), val = tensor([-2])]; tensor var_499_cast_fp16 = transpose(perm = var_499_perm_0, x = var_498_cast_fp16)[name = tensor("transpose_55")]; tensor var_500_cast_fp16 = squeeze(axes = var_500_axes_0, x = var_499_cast_fp16)[name = tensor("op_500_cast_fp16")]; tensor q_25_begin_0 = const()[name = tensor("q_25_begin_0"), val = tensor([0, 0, 0, 0])]; tensor q_25_end_0 = const()[name = tensor("q_25_end_0"), val = tensor([1, 50, 1, 768])]; tensor q_25_end_mask_0 = const()[name = tensor("q_25_end_mask_0"), val = tensor([false, true, true, true])]; tensor q_25_squeeze_mask_0 = const()[name = tensor("q_25_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor q_25_cast_fp16 = slice_by_index(begin = q_25_begin_0, end = q_25_end_0, end_mask = q_25_end_mask_0, squeeze_mask = q_25_squeeze_mask_0, x = var_500_cast_fp16)[name = tensor("q_25_cast_fp16")]; tensor k_25_begin_0 = const()[name = tensor("k_25_begin_0"), val = tensor([1, 0, 0, 0])]; tensor k_25_end_0 = const()[name = tensor("k_25_end_0"), val = tensor([2, 50, 1, 768])]; tensor k_25_end_mask_0 = const()[name = tensor("k_25_end_mask_0"), val = tensor([false, true, true, true])]; tensor k_25_squeeze_mask_0 = const()[name = tensor("k_25_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor k_25_cast_fp16 = slice_by_index(begin = k_25_begin_0, end = k_25_end_0, end_mask = k_25_end_mask_0, squeeze_mask = k_25_squeeze_mask_0, x = var_500_cast_fp16)[name = tensor("k_25_cast_fp16")]; tensor v_25_begin_0 = const()[name = tensor("v_25_begin_0"), val = tensor([2, 0, 0, 0])]; tensor v_25_end_0 = const()[name = tensor("v_25_end_0"), val = tensor([3, 50, 1, 768])]; tensor v_25_end_mask_0 = const()[name = tensor("v_25_end_mask_0"), val = tensor([false, true, true, true])]; tensor v_25_squeeze_mask_0 = const()[name = tensor("v_25_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor v_25_cast_fp16 = slice_by_index(begin = v_25_begin_0, end = v_25_end_0, end_mask = v_25_end_mask_0, squeeze_mask = v_25_squeeze_mask_0, x = var_500_cast_fp16)[name = tensor("v_25_cast_fp16")]; tensor var_508 = const()[name = tensor("op_508"), val = tensor([50, 12, 64])]; tensor var_509_cast_fp16 = reshape(shape = var_508, x = q_25_cast_fp16)[name = tensor("op_509_cast_fp16")]; tensor q_27_perm_0 = const()[name = tensor("q_27_perm_0"), val = tensor([1, 0, 2])]; tensor var_515 = const()[name = tensor("op_515"), val = tensor([50, 12, 64])]; tensor var_516_cast_fp16 = reshape(shape = var_515, x = k_25_cast_fp16)[name = tensor("op_516_cast_fp16")]; tensor k_27_perm_0 = const()[name = tensor("k_27_perm_0"), val = tensor([1, 0, 2])]; tensor var_522 = const()[name = tensor("op_522"), val = tensor([50, 12, 64])]; tensor var_523_cast_fp16 = reshape(shape = var_522, x = v_25_cast_fp16)[name = tensor("op_523_cast_fp16")]; tensor v_27_perm_0 = const()[name = tensor("v_27_perm_0"), val = tensor([1, 0, 2])]; tensor var_526 = const()[name = tensor("op_526"), val = tensor([1, 12, 50, 64])]; tensor q_27_cast_fp16 = transpose(perm = q_27_perm_0, x = var_509_cast_fp16)[name = tensor("transpose_54")]; tensor q_29_cast_fp16 = reshape(shape = var_526, x = q_27_cast_fp16)[name = tensor("q_29_cast_fp16")]; tensor var_528 = const()[name = tensor("op_528"), val = tensor([1, 12, 50, 64])]; tensor k_27_cast_fp16 = transpose(perm = k_27_perm_0, x = var_516_cast_fp16)[name = tensor("transpose_53")]; tensor k_29_cast_fp16 = reshape(shape = var_528, x = k_27_cast_fp16)[name = tensor("k_29_cast_fp16")]; tensor var_530 = const()[name = tensor("op_530"), val = tensor([1, 12, 50, 64])]; tensor v_27_cast_fp16 = transpose(perm = v_27_perm_0, x = var_523_cast_fp16)[name = tensor("transpose_52")]; tensor v_29_cast_fp16 = reshape(shape = var_530, x = v_27_cast_fp16)[name = tensor("v_29_cast_fp16")]; tensor mul_9_y_0_to_fp16 = const()[name = tensor("mul_9_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor mul_9_cast_fp16 = mul(x = q_29_cast_fp16, y = mul_9_y_0_to_fp16)[name = tensor("mul_9_cast_fp16")]; tensor matmul_4_transpose_y_0 = const()[name = tensor("matmul_4_transpose_y_0"), val = tensor(true)]; tensor matmul_4_transpose_x_0 = const()[name = tensor("matmul_4_transpose_x_0"), val = tensor(false)]; tensor matmul_4_cast_fp16 = matmul(transpose_x = matmul_4_transpose_x_0, transpose_y = matmul_4_transpose_y_0, x = mul_9_cast_fp16, y = k_29_cast_fp16)[name = tensor("matmul_4_cast_fp16")]; tensor softmax_4_axis_0 = const()[name = tensor("softmax_4_axis_0"), val = tensor(-1)]; tensor softmax_4_cast_fp16 = softmax(axis = softmax_4_axis_0, x = matmul_4_cast_fp16)[name = tensor("softmax_4_cast_fp16")]; tensor attn_output_33_transpose_x_0 = const()[name = tensor("attn_output_33_transpose_x_0"), val = tensor(false)]; tensor attn_output_33_transpose_y_0 = const()[name = tensor("attn_output_33_transpose_y_0"), val = tensor(false)]; tensor attn_output_33_cast_fp16 = matmul(transpose_x = attn_output_33_transpose_x_0, transpose_y = attn_output_33_transpose_y_0, x = softmax_4_cast_fp16, y = v_29_cast_fp16)[name = tensor("attn_output_33_cast_fp16")]; tensor var_533 = const()[name = tensor("op_533"), val = tensor([2, 0, 1, 3])]; tensor var_538 = const()[name = tensor("op_538"), val = tensor([50, 768])]; tensor var_534_cast_fp16 = transpose(perm = var_533, x = attn_output_33_cast_fp16)[name = tensor("transpose_51")]; tensor attn_output_35_cast_fp16 = reshape(shape = var_538, x = var_534_cast_fp16)[name = tensor("attn_output_35_cast_fp16")]; tensor model_visual_transformer_resblocks_4_attn_out_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_4_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65053312)))]; tensor model_visual_transformer_resblocks_4_attn_out_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_4_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(66233024)))]; tensor linear_17_cast_fp16 = linear(bias = model_visual_transformer_resblocks_4_attn_out_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_4_attn_out_proj_weight_to_fp16, x = attn_output_35_cast_fp16)[name = tensor("linear_17_cast_fp16")]; tensor var_542 = const()[name = tensor("op_542"), val = tensor([50, 1, 768])]; tensor attn_output_39_cast_fp16 = reshape(shape = var_542, x = linear_17_cast_fp16)[name = tensor("attn_output_39_cast_fp16")]; tensor var_544_perm_0 = const()[name = tensor("op_544_perm_0"), val = tensor([1, 0, 2])]; tensor var_544_cast_fp16 = transpose(perm = var_544_perm_0, x = attn_output_39_cast_fp16)[name = tensor("transpose_50")]; tensor input_45_cast_fp16 = add(x = input_43_cast_fp16, y = var_544_cast_fp16)[name = tensor("input_45_cast_fp16")]; tensor x_29_axes_0 = const()[name = tensor("x_29_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_4_ln_2_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_4_ln_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(66234624)))]; tensor model_visual_transformer_resblocks_4_ln_2_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_4_ln_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(66236224)))]; tensor x_29_cast_fp16 = layer_norm(axes = x_29_axes_0, beta = model_visual_transformer_resblocks_4_ln_2_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_4_ln_2_weight_to_fp16, x = input_45_cast_fp16)[name = tensor("x_29_cast_fp16")]; tensor model_visual_transformer_resblocks_4_mlp_c_fc_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_4_mlp_c_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(66237824)))]; tensor model_visual_transformer_resblocks_4_mlp_c_fc_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_4_mlp_c_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(70956480)))]; tensor linear_18_cast_fp16 = linear(bias = model_visual_transformer_resblocks_4_mlp_c_fc_bias_to_fp16, weight = model_visual_transformer_resblocks_4_mlp_c_fc_weight_to_fp16, x = x_29_cast_fp16)[name = tensor("linear_18_cast_fp16")]; tensor input_51_mode_0 = const()[name = tensor("input_51_mode_0"), val = tensor("EXACT")]; tensor input_51_cast_fp16 = gelu(mode = input_51_mode_0, x = linear_18_cast_fp16)[name = tensor("input_51_cast_fp16")]; tensor model_visual_transformer_resblocks_4_mlp_c_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_4_mlp_c_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(70962688)))]; tensor model_visual_transformer_resblocks_4_mlp_c_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_4_mlp_c_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75681344)))]; tensor linear_19_cast_fp16 = linear(bias = model_visual_transformer_resblocks_4_mlp_c_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_4_mlp_c_proj_weight_to_fp16, x = input_51_cast_fp16)[name = tensor("linear_19_cast_fp16")]; tensor input_53_cast_fp16 = add(x = input_45_cast_fp16, y = linear_19_cast_fp16)[name = tensor("input_53_cast_fp16")]; tensor x_31_axes_0 = const()[name = tensor("x_31_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_5_ln_1_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_5_ln_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75682944)))]; tensor model_visual_transformer_resblocks_5_ln_1_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_5_ln_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75684544)))]; tensor x_31_cast_fp16 = layer_norm(axes = x_31_axes_0, beta = model_visual_transformer_resblocks_5_ln_1_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_5_ln_1_weight_to_fp16, x = input_53_cast_fp16)[name = tensor("x_31_cast_fp16")]; tensor query_23_perm_0 = const()[name = tensor("query_23_perm_0"), val = tensor([1, 0, 2])]; tensor model_visual_transformer_resblocks_5_attn_in_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_5_attn_in_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75686144)))]; tensor model_visual_transformer_resblocks_5_attn_in_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_5_attn_in_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(79225152)))]; tensor query_23_cast_fp16 = transpose(perm = query_23_perm_0, x = x_31_cast_fp16)[name = tensor("transpose_49")]; tensor linear_20_cast_fp16 = linear(bias = model_visual_transformer_resblocks_5_attn_in_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_5_attn_in_proj_weight_to_fp16, x = query_23_cast_fp16)[name = tensor("linear_20_cast_fp16")]; tensor concat_6 = const()[name = tensor("concat_6"), val = tensor([50, 1, 3, 768])]; tensor var_593_cast_fp16 = reshape(shape = concat_6, x = linear_20_cast_fp16)[name = tensor("op_593_cast_fp16")]; tensor var_594_axes_0 = const()[name = tensor("op_594_axes_0"), val = tensor([0])]; tensor var_594_cast_fp16 = expand_dims(axes = var_594_axes_0, x = var_593_cast_fp16)[name = tensor("op_594_cast_fp16")]; tensor var_595_perm_0 = const()[name = tensor("op_595_perm_0"), val = tensor([-2, 1, 2, 0, 4])]; tensor var_596_axes_0 = const()[name = tensor("op_596_axes_0"), val = tensor([-2])]; tensor var_595_cast_fp16 = transpose(perm = var_595_perm_0, x = var_594_cast_fp16)[name = tensor("transpose_48")]; tensor var_596_cast_fp16 = squeeze(axes = var_596_axes_0, x = var_595_cast_fp16)[name = tensor("op_596_cast_fp16")]; tensor q_31_begin_0 = const()[name = tensor("q_31_begin_0"), val = tensor([0, 0, 0, 0])]; tensor q_31_end_0 = const()[name = tensor("q_31_end_0"), val = tensor([1, 50, 1, 768])]; tensor q_31_end_mask_0 = const()[name = tensor("q_31_end_mask_0"), val = tensor([false, true, true, true])]; tensor q_31_squeeze_mask_0 = const()[name = tensor("q_31_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor q_31_cast_fp16 = slice_by_index(begin = q_31_begin_0, end = q_31_end_0, end_mask = q_31_end_mask_0, squeeze_mask = q_31_squeeze_mask_0, x = var_596_cast_fp16)[name = tensor("q_31_cast_fp16")]; tensor k_31_begin_0 = const()[name = tensor("k_31_begin_0"), val = tensor([1, 0, 0, 0])]; tensor k_31_end_0 = const()[name = tensor("k_31_end_0"), val = tensor([2, 50, 1, 768])]; tensor k_31_end_mask_0 = const()[name = tensor("k_31_end_mask_0"), val = tensor([false, true, true, true])]; tensor k_31_squeeze_mask_0 = const()[name = tensor("k_31_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor k_31_cast_fp16 = slice_by_index(begin = k_31_begin_0, end = k_31_end_0, end_mask = k_31_end_mask_0, squeeze_mask = k_31_squeeze_mask_0, x = var_596_cast_fp16)[name = tensor("k_31_cast_fp16")]; tensor v_31_begin_0 = const()[name = tensor("v_31_begin_0"), val = tensor([2, 0, 0, 0])]; tensor v_31_end_0 = const()[name = tensor("v_31_end_0"), val = tensor([3, 50, 1, 768])]; tensor v_31_end_mask_0 = const()[name = tensor("v_31_end_mask_0"), val = tensor([false, true, true, true])]; tensor v_31_squeeze_mask_0 = const()[name = tensor("v_31_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor v_31_cast_fp16 = slice_by_index(begin = v_31_begin_0, end = v_31_end_0, end_mask = v_31_end_mask_0, squeeze_mask = v_31_squeeze_mask_0, x = var_596_cast_fp16)[name = tensor("v_31_cast_fp16")]; tensor var_604 = const()[name = tensor("op_604"), val = tensor([50, 12, 64])]; tensor var_605_cast_fp16 = reshape(shape = var_604, x = q_31_cast_fp16)[name = tensor("op_605_cast_fp16")]; tensor q_33_perm_0 = const()[name = tensor("q_33_perm_0"), val = tensor([1, 0, 2])]; tensor var_611 = const()[name = tensor("op_611"), val = tensor([50, 12, 64])]; tensor var_612_cast_fp16 = reshape(shape = var_611, x = k_31_cast_fp16)[name = tensor("op_612_cast_fp16")]; tensor k_33_perm_0 = const()[name = tensor("k_33_perm_0"), val = tensor([1, 0, 2])]; tensor var_618 = const()[name = tensor("op_618"), val = tensor([50, 12, 64])]; tensor var_619_cast_fp16 = reshape(shape = var_618, x = v_31_cast_fp16)[name = tensor("op_619_cast_fp16")]; tensor v_33_perm_0 = const()[name = tensor("v_33_perm_0"), val = tensor([1, 0, 2])]; tensor var_622 = const()[name = tensor("op_622"), val = tensor([1, 12, 50, 64])]; tensor q_33_cast_fp16 = transpose(perm = q_33_perm_0, x = var_605_cast_fp16)[name = tensor("transpose_47")]; tensor q_35_cast_fp16 = reshape(shape = var_622, x = q_33_cast_fp16)[name = tensor("q_35_cast_fp16")]; tensor var_624 = const()[name = tensor("op_624"), val = tensor([1, 12, 50, 64])]; tensor k_33_cast_fp16 = transpose(perm = k_33_perm_0, x = var_612_cast_fp16)[name = tensor("transpose_46")]; tensor k_35_cast_fp16 = reshape(shape = var_624, x = k_33_cast_fp16)[name = tensor("k_35_cast_fp16")]; tensor var_626 = const()[name = tensor("op_626"), val = tensor([1, 12, 50, 64])]; tensor v_33_cast_fp16 = transpose(perm = v_33_perm_0, x = var_619_cast_fp16)[name = tensor("transpose_45")]; tensor v_35_cast_fp16 = reshape(shape = var_626, x = v_33_cast_fp16)[name = tensor("v_35_cast_fp16")]; tensor mul_11_y_0_to_fp16 = const()[name = tensor("mul_11_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor mul_11_cast_fp16 = mul(x = q_35_cast_fp16, y = mul_11_y_0_to_fp16)[name = tensor("mul_11_cast_fp16")]; tensor matmul_5_transpose_y_0 = const()[name = tensor("matmul_5_transpose_y_0"), val = tensor(true)]; tensor matmul_5_transpose_x_0 = const()[name = tensor("matmul_5_transpose_x_0"), val = tensor(false)]; tensor matmul_5_cast_fp16 = matmul(transpose_x = matmul_5_transpose_x_0, transpose_y = matmul_5_transpose_y_0, x = mul_11_cast_fp16, y = k_35_cast_fp16)[name = tensor("matmul_5_cast_fp16")]; tensor softmax_5_axis_0 = const()[name = tensor("softmax_5_axis_0"), val = tensor(-1)]; tensor softmax_5_cast_fp16 = softmax(axis = softmax_5_axis_0, x = matmul_5_cast_fp16)[name = tensor("softmax_5_cast_fp16")]; tensor attn_output_41_transpose_x_0 = const()[name = tensor("attn_output_41_transpose_x_0"), val = tensor(false)]; tensor attn_output_41_transpose_y_0 = const()[name = tensor("attn_output_41_transpose_y_0"), val = tensor(false)]; tensor attn_output_41_cast_fp16 = matmul(transpose_x = attn_output_41_transpose_x_0, transpose_y = attn_output_41_transpose_y_0, x = softmax_5_cast_fp16, y = v_35_cast_fp16)[name = tensor("attn_output_41_cast_fp16")]; tensor var_629 = const()[name = tensor("op_629"), val = tensor([2, 0, 1, 3])]; tensor var_634 = const()[name = tensor("op_634"), val = tensor([50, 768])]; tensor var_630_cast_fp16 = transpose(perm = var_629, x = attn_output_41_cast_fp16)[name = tensor("transpose_44")]; tensor attn_output_43_cast_fp16 = reshape(shape = var_634, x = var_630_cast_fp16)[name = tensor("attn_output_43_cast_fp16")]; tensor model_visual_transformer_resblocks_5_attn_out_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_5_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(79229824)))]; tensor model_visual_transformer_resblocks_5_attn_out_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_5_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80409536)))]; tensor linear_21_cast_fp16 = linear(bias = model_visual_transformer_resblocks_5_attn_out_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_5_attn_out_proj_weight_to_fp16, x = attn_output_43_cast_fp16)[name = tensor("linear_21_cast_fp16")]; tensor var_638 = const()[name = tensor("op_638"), val = tensor([50, 1, 768])]; tensor attn_output_47_cast_fp16 = reshape(shape = var_638, x = linear_21_cast_fp16)[name = tensor("attn_output_47_cast_fp16")]; tensor var_640_perm_0 = const()[name = tensor("op_640_perm_0"), val = tensor([1, 0, 2])]; tensor var_640_cast_fp16 = transpose(perm = var_640_perm_0, x = attn_output_47_cast_fp16)[name = tensor("transpose_43")]; tensor input_55_cast_fp16 = add(x = input_53_cast_fp16, y = var_640_cast_fp16)[name = tensor("input_55_cast_fp16")]; tensor x_33_axes_0 = const()[name = tensor("x_33_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_5_ln_2_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_5_ln_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80411136)))]; tensor model_visual_transformer_resblocks_5_ln_2_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_5_ln_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80412736)))]; tensor x_33_cast_fp16 = layer_norm(axes = x_33_axes_0, beta = model_visual_transformer_resblocks_5_ln_2_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_5_ln_2_weight_to_fp16, x = input_55_cast_fp16)[name = tensor("x_33_cast_fp16")]; tensor model_visual_transformer_resblocks_5_mlp_c_fc_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_5_mlp_c_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80414336)))]; tensor model_visual_transformer_resblocks_5_mlp_c_fc_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_5_mlp_c_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85132992)))]; tensor linear_22_cast_fp16 = linear(bias = model_visual_transformer_resblocks_5_mlp_c_fc_bias_to_fp16, weight = model_visual_transformer_resblocks_5_mlp_c_fc_weight_to_fp16, x = x_33_cast_fp16)[name = tensor("linear_22_cast_fp16")]; tensor input_61_mode_0 = const()[name = tensor("input_61_mode_0"), val = tensor("EXACT")]; tensor input_61_cast_fp16 = gelu(mode = input_61_mode_0, x = linear_22_cast_fp16)[name = tensor("input_61_cast_fp16")]; tensor model_visual_transformer_resblocks_5_mlp_c_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_5_mlp_c_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85139200)))]; tensor model_visual_transformer_resblocks_5_mlp_c_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_5_mlp_c_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89857856)))]; tensor linear_23_cast_fp16 = linear(bias = model_visual_transformer_resblocks_5_mlp_c_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_5_mlp_c_proj_weight_to_fp16, x = input_61_cast_fp16)[name = tensor("linear_23_cast_fp16")]; tensor input_63_cast_fp16 = add(x = input_55_cast_fp16, y = linear_23_cast_fp16)[name = tensor("input_63_cast_fp16")]; tensor x_35_axes_0 = const()[name = tensor("x_35_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_6_ln_1_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_6_ln_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89859456)))]; tensor model_visual_transformer_resblocks_6_ln_1_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_6_ln_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89861056)))]; tensor x_35_cast_fp16 = layer_norm(axes = x_35_axes_0, beta = model_visual_transformer_resblocks_6_ln_1_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_6_ln_1_weight_to_fp16, x = input_63_cast_fp16)[name = tensor("x_35_cast_fp16")]; tensor query_27_perm_0 = const()[name = tensor("query_27_perm_0"), val = tensor([1, 0, 2])]; tensor model_visual_transformer_resblocks_6_attn_in_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_6_attn_in_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89862656)))]; tensor model_visual_transformer_resblocks_6_attn_in_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_6_attn_in_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93401664)))]; tensor query_27_cast_fp16 = transpose(perm = query_27_perm_0, x = x_35_cast_fp16)[name = tensor("transpose_42")]; tensor linear_24_cast_fp16 = linear(bias = model_visual_transformer_resblocks_6_attn_in_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_6_attn_in_proj_weight_to_fp16, x = query_27_cast_fp16)[name = tensor("linear_24_cast_fp16")]; tensor concat_7 = const()[name = tensor("concat_7"), val = tensor([50, 1, 3, 768])]; tensor var_689_cast_fp16 = reshape(shape = concat_7, x = linear_24_cast_fp16)[name = tensor("op_689_cast_fp16")]; tensor var_690_axes_0 = const()[name = tensor("op_690_axes_0"), val = tensor([0])]; tensor var_690_cast_fp16 = expand_dims(axes = var_690_axes_0, x = var_689_cast_fp16)[name = tensor("op_690_cast_fp16")]; tensor var_691_perm_0 = const()[name = tensor("op_691_perm_0"), val = tensor([-2, 1, 2, 0, 4])]; tensor var_692_axes_0 = const()[name = tensor("op_692_axes_0"), val = tensor([-2])]; tensor var_691_cast_fp16 = transpose(perm = var_691_perm_0, x = var_690_cast_fp16)[name = tensor("transpose_41")]; tensor var_692_cast_fp16 = squeeze(axes = var_692_axes_0, x = var_691_cast_fp16)[name = tensor("op_692_cast_fp16")]; tensor q_37_begin_0 = const()[name = tensor("q_37_begin_0"), val = tensor([0, 0, 0, 0])]; tensor q_37_end_0 = const()[name = tensor("q_37_end_0"), val = tensor([1, 50, 1, 768])]; tensor q_37_end_mask_0 = const()[name = tensor("q_37_end_mask_0"), val = tensor([false, true, true, true])]; tensor q_37_squeeze_mask_0 = const()[name = tensor("q_37_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor q_37_cast_fp16 = slice_by_index(begin = q_37_begin_0, end = q_37_end_0, end_mask = q_37_end_mask_0, squeeze_mask = q_37_squeeze_mask_0, x = var_692_cast_fp16)[name = tensor("q_37_cast_fp16")]; tensor k_37_begin_0 = const()[name = tensor("k_37_begin_0"), val = tensor([1, 0, 0, 0])]; tensor k_37_end_0 = const()[name = tensor("k_37_end_0"), val = tensor([2, 50, 1, 768])]; tensor k_37_end_mask_0 = const()[name = tensor("k_37_end_mask_0"), val = tensor([false, true, true, true])]; tensor k_37_squeeze_mask_0 = const()[name = tensor("k_37_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor k_37_cast_fp16 = slice_by_index(begin = k_37_begin_0, end = k_37_end_0, end_mask = k_37_end_mask_0, squeeze_mask = k_37_squeeze_mask_0, x = var_692_cast_fp16)[name = tensor("k_37_cast_fp16")]; tensor v_37_begin_0 = const()[name = tensor("v_37_begin_0"), val = tensor([2, 0, 0, 0])]; tensor v_37_end_0 = const()[name = tensor("v_37_end_0"), val = tensor([3, 50, 1, 768])]; tensor v_37_end_mask_0 = const()[name = tensor("v_37_end_mask_0"), val = tensor([false, true, true, true])]; tensor v_37_squeeze_mask_0 = const()[name = tensor("v_37_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor v_37_cast_fp16 = slice_by_index(begin = v_37_begin_0, end = v_37_end_0, end_mask = v_37_end_mask_0, squeeze_mask = v_37_squeeze_mask_0, x = var_692_cast_fp16)[name = tensor("v_37_cast_fp16")]; tensor var_700 = const()[name = tensor("op_700"), val = tensor([50, 12, 64])]; tensor var_701_cast_fp16 = reshape(shape = var_700, x = q_37_cast_fp16)[name = tensor("op_701_cast_fp16")]; tensor q_39_perm_0 = const()[name = tensor("q_39_perm_0"), val = tensor([1, 0, 2])]; tensor var_707 = const()[name = tensor("op_707"), val = tensor([50, 12, 64])]; tensor var_708_cast_fp16 = reshape(shape = var_707, x = k_37_cast_fp16)[name = tensor("op_708_cast_fp16")]; tensor k_39_perm_0 = const()[name = tensor("k_39_perm_0"), val = tensor([1, 0, 2])]; tensor var_714 = const()[name = tensor("op_714"), val = tensor([50, 12, 64])]; tensor var_715_cast_fp16 = reshape(shape = var_714, x = v_37_cast_fp16)[name = tensor("op_715_cast_fp16")]; tensor v_39_perm_0 = const()[name = tensor("v_39_perm_0"), val = tensor([1, 0, 2])]; tensor var_718 = const()[name = tensor("op_718"), val = tensor([1, 12, 50, 64])]; tensor q_39_cast_fp16 = transpose(perm = q_39_perm_0, x = var_701_cast_fp16)[name = tensor("transpose_40")]; tensor q_41_cast_fp16 = reshape(shape = var_718, x = q_39_cast_fp16)[name = tensor("q_41_cast_fp16")]; tensor var_720 = const()[name = tensor("op_720"), val = tensor([1, 12, 50, 64])]; tensor k_39_cast_fp16 = transpose(perm = k_39_perm_0, x = var_708_cast_fp16)[name = tensor("transpose_39")]; tensor k_41_cast_fp16 = reshape(shape = var_720, x = k_39_cast_fp16)[name = tensor("k_41_cast_fp16")]; tensor var_722 = const()[name = tensor("op_722"), val = tensor([1, 12, 50, 64])]; tensor v_39_cast_fp16 = transpose(perm = v_39_perm_0, x = var_715_cast_fp16)[name = tensor("transpose_38")]; tensor v_41_cast_fp16 = reshape(shape = var_722, x = v_39_cast_fp16)[name = tensor("v_41_cast_fp16")]; tensor mul_13_y_0_to_fp16 = const()[name = tensor("mul_13_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor mul_13_cast_fp16 = mul(x = q_41_cast_fp16, y = mul_13_y_0_to_fp16)[name = tensor("mul_13_cast_fp16")]; tensor matmul_6_transpose_y_0 = const()[name = tensor("matmul_6_transpose_y_0"), val = tensor(true)]; tensor matmul_6_transpose_x_0 = const()[name = tensor("matmul_6_transpose_x_0"), val = tensor(false)]; tensor matmul_6_cast_fp16 = matmul(transpose_x = matmul_6_transpose_x_0, transpose_y = matmul_6_transpose_y_0, x = mul_13_cast_fp16, y = k_41_cast_fp16)[name = tensor("matmul_6_cast_fp16")]; tensor softmax_6_axis_0 = const()[name = tensor("softmax_6_axis_0"), val = tensor(-1)]; tensor softmax_6_cast_fp16 = softmax(axis = softmax_6_axis_0, x = matmul_6_cast_fp16)[name = tensor("softmax_6_cast_fp16")]; tensor attn_output_49_transpose_x_0 = const()[name = tensor("attn_output_49_transpose_x_0"), val = tensor(false)]; tensor attn_output_49_transpose_y_0 = const()[name = tensor("attn_output_49_transpose_y_0"), val = tensor(false)]; tensor attn_output_49_cast_fp16 = matmul(transpose_x = attn_output_49_transpose_x_0, transpose_y = attn_output_49_transpose_y_0, x = softmax_6_cast_fp16, y = v_41_cast_fp16)[name = tensor("attn_output_49_cast_fp16")]; tensor var_725 = const()[name = tensor("op_725"), val = tensor([2, 0, 1, 3])]; tensor var_730 = const()[name = tensor("op_730"), val = tensor([50, 768])]; tensor var_726_cast_fp16 = transpose(perm = var_725, x = attn_output_49_cast_fp16)[name = tensor("transpose_37")]; tensor attn_output_51_cast_fp16 = reshape(shape = var_730, x = var_726_cast_fp16)[name = tensor("attn_output_51_cast_fp16")]; tensor model_visual_transformer_resblocks_6_attn_out_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_6_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93406336)))]; tensor model_visual_transformer_resblocks_6_attn_out_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_6_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94586048)))]; tensor linear_25_cast_fp16 = linear(bias = model_visual_transformer_resblocks_6_attn_out_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_6_attn_out_proj_weight_to_fp16, x = attn_output_51_cast_fp16)[name = tensor("linear_25_cast_fp16")]; tensor var_734 = const()[name = tensor("op_734"), val = tensor([50, 1, 768])]; tensor attn_output_55_cast_fp16 = reshape(shape = var_734, x = linear_25_cast_fp16)[name = tensor("attn_output_55_cast_fp16")]; tensor var_736_perm_0 = const()[name = tensor("op_736_perm_0"), val = tensor([1, 0, 2])]; tensor var_736_cast_fp16 = transpose(perm = var_736_perm_0, x = attn_output_55_cast_fp16)[name = tensor("transpose_36")]; tensor input_65_cast_fp16 = add(x = input_63_cast_fp16, y = var_736_cast_fp16)[name = tensor("input_65_cast_fp16")]; tensor x_37_axes_0 = const()[name = tensor("x_37_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_6_ln_2_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_6_ln_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94587648)))]; tensor model_visual_transformer_resblocks_6_ln_2_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_6_ln_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94589248)))]; tensor x_37_cast_fp16 = layer_norm(axes = x_37_axes_0, beta = model_visual_transformer_resblocks_6_ln_2_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_6_ln_2_weight_to_fp16, x = input_65_cast_fp16)[name = tensor("x_37_cast_fp16")]; tensor model_visual_transformer_resblocks_6_mlp_c_fc_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_6_mlp_c_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94590848)))]; tensor model_visual_transformer_resblocks_6_mlp_c_fc_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_6_mlp_c_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(99309504)))]; tensor linear_26_cast_fp16 = linear(bias = model_visual_transformer_resblocks_6_mlp_c_fc_bias_to_fp16, weight = model_visual_transformer_resblocks_6_mlp_c_fc_weight_to_fp16, x = x_37_cast_fp16)[name = tensor("linear_26_cast_fp16")]; tensor input_71_mode_0 = const()[name = tensor("input_71_mode_0"), val = tensor("EXACT")]; tensor input_71_cast_fp16 = gelu(mode = input_71_mode_0, x = linear_26_cast_fp16)[name = tensor("input_71_cast_fp16")]; tensor model_visual_transformer_resblocks_6_mlp_c_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_6_mlp_c_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(99315712)))]; tensor model_visual_transformer_resblocks_6_mlp_c_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_6_mlp_c_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(104034368)))]; tensor linear_27_cast_fp16 = linear(bias = model_visual_transformer_resblocks_6_mlp_c_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_6_mlp_c_proj_weight_to_fp16, x = input_71_cast_fp16)[name = tensor("linear_27_cast_fp16")]; tensor input_73_cast_fp16 = add(x = input_65_cast_fp16, y = linear_27_cast_fp16)[name = tensor("input_73_cast_fp16")]; tensor x_39_axes_0 = const()[name = tensor("x_39_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_7_ln_1_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_7_ln_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(104035968)))]; tensor model_visual_transformer_resblocks_7_ln_1_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_7_ln_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(104037568)))]; tensor x_39_cast_fp16 = layer_norm(axes = x_39_axes_0, beta = model_visual_transformer_resblocks_7_ln_1_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_7_ln_1_weight_to_fp16, x = input_73_cast_fp16)[name = tensor("x_39_cast_fp16")]; tensor query_31_perm_0 = const()[name = tensor("query_31_perm_0"), val = tensor([1, 0, 2])]; tensor model_visual_transformer_resblocks_7_attn_in_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_7_attn_in_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(104039168)))]; tensor model_visual_transformer_resblocks_7_attn_in_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_7_attn_in_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(107578176)))]; tensor query_31_cast_fp16 = transpose(perm = query_31_perm_0, x = x_39_cast_fp16)[name = tensor("transpose_35")]; tensor linear_28_cast_fp16 = linear(bias = model_visual_transformer_resblocks_7_attn_in_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_7_attn_in_proj_weight_to_fp16, x = query_31_cast_fp16)[name = tensor("linear_28_cast_fp16")]; tensor concat_8 = const()[name = tensor("concat_8"), val = tensor([50, 1, 3, 768])]; tensor var_785_cast_fp16 = reshape(shape = concat_8, x = linear_28_cast_fp16)[name = tensor("op_785_cast_fp16")]; tensor var_786_axes_0 = const()[name = tensor("op_786_axes_0"), val = tensor([0])]; tensor var_786_cast_fp16 = expand_dims(axes = var_786_axes_0, x = var_785_cast_fp16)[name = tensor("op_786_cast_fp16")]; tensor var_787_perm_0 = const()[name = tensor("op_787_perm_0"), val = tensor([-2, 1, 2, 0, 4])]; tensor var_788_axes_0 = const()[name = tensor("op_788_axes_0"), val = tensor([-2])]; tensor var_787_cast_fp16 = transpose(perm = var_787_perm_0, x = var_786_cast_fp16)[name = tensor("transpose_34")]; tensor var_788_cast_fp16 = squeeze(axes = var_788_axes_0, x = var_787_cast_fp16)[name = tensor("op_788_cast_fp16")]; tensor q_43_begin_0 = const()[name = tensor("q_43_begin_0"), val = tensor([0, 0, 0, 0])]; tensor q_43_end_0 = const()[name = tensor("q_43_end_0"), val = tensor([1, 50, 1, 768])]; tensor q_43_end_mask_0 = const()[name = tensor("q_43_end_mask_0"), val = tensor([false, true, true, true])]; tensor q_43_squeeze_mask_0 = const()[name = tensor("q_43_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor q_43_cast_fp16 = slice_by_index(begin = q_43_begin_0, end = q_43_end_0, end_mask = q_43_end_mask_0, squeeze_mask = q_43_squeeze_mask_0, x = var_788_cast_fp16)[name = tensor("q_43_cast_fp16")]; tensor k_43_begin_0 = const()[name = tensor("k_43_begin_0"), val = tensor([1, 0, 0, 0])]; tensor k_43_end_0 = const()[name = tensor("k_43_end_0"), val = tensor([2, 50, 1, 768])]; tensor k_43_end_mask_0 = const()[name = tensor("k_43_end_mask_0"), val = tensor([false, true, true, true])]; tensor k_43_squeeze_mask_0 = const()[name = tensor("k_43_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor k_43_cast_fp16 = slice_by_index(begin = k_43_begin_0, end = k_43_end_0, end_mask = k_43_end_mask_0, squeeze_mask = k_43_squeeze_mask_0, x = var_788_cast_fp16)[name = tensor("k_43_cast_fp16")]; tensor v_43_begin_0 = const()[name = tensor("v_43_begin_0"), val = tensor([2, 0, 0, 0])]; tensor v_43_end_0 = const()[name = tensor("v_43_end_0"), val = tensor([3, 50, 1, 768])]; tensor v_43_end_mask_0 = const()[name = tensor("v_43_end_mask_0"), val = tensor([false, true, true, true])]; tensor v_43_squeeze_mask_0 = const()[name = tensor("v_43_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor v_43_cast_fp16 = slice_by_index(begin = v_43_begin_0, end = v_43_end_0, end_mask = v_43_end_mask_0, squeeze_mask = v_43_squeeze_mask_0, x = var_788_cast_fp16)[name = tensor("v_43_cast_fp16")]; tensor var_796 = const()[name = tensor("op_796"), val = tensor([50, 12, 64])]; tensor var_797_cast_fp16 = reshape(shape = var_796, x = q_43_cast_fp16)[name = tensor("op_797_cast_fp16")]; tensor q_45_perm_0 = const()[name = tensor("q_45_perm_0"), val = tensor([1, 0, 2])]; tensor var_803 = const()[name = tensor("op_803"), val = tensor([50, 12, 64])]; tensor var_804_cast_fp16 = reshape(shape = var_803, x = k_43_cast_fp16)[name = tensor("op_804_cast_fp16")]; tensor k_45_perm_0 = const()[name = tensor("k_45_perm_0"), val = tensor([1, 0, 2])]; tensor var_810 = const()[name = tensor("op_810"), val = tensor([50, 12, 64])]; tensor var_811_cast_fp16 = reshape(shape = var_810, x = v_43_cast_fp16)[name = tensor("op_811_cast_fp16")]; tensor v_45_perm_0 = const()[name = tensor("v_45_perm_0"), val = tensor([1, 0, 2])]; tensor var_814 = const()[name = tensor("op_814"), val = tensor([1, 12, 50, 64])]; tensor q_45_cast_fp16 = transpose(perm = q_45_perm_0, x = var_797_cast_fp16)[name = tensor("transpose_33")]; tensor q_47_cast_fp16 = reshape(shape = var_814, x = q_45_cast_fp16)[name = tensor("q_47_cast_fp16")]; tensor var_816 = const()[name = tensor("op_816"), val = tensor([1, 12, 50, 64])]; tensor k_45_cast_fp16 = transpose(perm = k_45_perm_0, x = var_804_cast_fp16)[name = tensor("transpose_32")]; tensor k_47_cast_fp16 = reshape(shape = var_816, x = k_45_cast_fp16)[name = tensor("k_47_cast_fp16")]; tensor var_818 = const()[name = tensor("op_818"), val = tensor([1, 12, 50, 64])]; tensor v_45_cast_fp16 = transpose(perm = v_45_perm_0, x = var_811_cast_fp16)[name = tensor("transpose_31")]; tensor v_47_cast_fp16 = reshape(shape = var_818, x = v_45_cast_fp16)[name = tensor("v_47_cast_fp16")]; tensor mul_15_y_0_to_fp16 = const()[name = tensor("mul_15_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor mul_15_cast_fp16 = mul(x = q_47_cast_fp16, y = mul_15_y_0_to_fp16)[name = tensor("mul_15_cast_fp16")]; tensor matmul_7_transpose_y_0 = const()[name = tensor("matmul_7_transpose_y_0"), val = tensor(true)]; tensor matmul_7_transpose_x_0 = const()[name = tensor("matmul_7_transpose_x_0"), val = tensor(false)]; tensor matmul_7_cast_fp16 = matmul(transpose_x = matmul_7_transpose_x_0, transpose_y = matmul_7_transpose_y_0, x = mul_15_cast_fp16, y = k_47_cast_fp16)[name = tensor("matmul_7_cast_fp16")]; tensor softmax_7_axis_0 = const()[name = tensor("softmax_7_axis_0"), val = tensor(-1)]; tensor softmax_7_cast_fp16 = softmax(axis = softmax_7_axis_0, x = matmul_7_cast_fp16)[name = tensor("softmax_7_cast_fp16")]; tensor attn_output_57_transpose_x_0 = const()[name = tensor("attn_output_57_transpose_x_0"), val = tensor(false)]; tensor attn_output_57_transpose_y_0 = const()[name = tensor("attn_output_57_transpose_y_0"), val = tensor(false)]; tensor attn_output_57_cast_fp16 = matmul(transpose_x = attn_output_57_transpose_x_0, transpose_y = attn_output_57_transpose_y_0, x = softmax_7_cast_fp16, y = v_47_cast_fp16)[name = tensor("attn_output_57_cast_fp16")]; tensor var_821 = const()[name = tensor("op_821"), val = tensor([2, 0, 1, 3])]; tensor var_826 = const()[name = tensor("op_826"), val = tensor([50, 768])]; tensor var_822_cast_fp16 = transpose(perm = var_821, x = attn_output_57_cast_fp16)[name = tensor("transpose_30")]; tensor attn_output_59_cast_fp16 = reshape(shape = var_826, x = var_822_cast_fp16)[name = tensor("attn_output_59_cast_fp16")]; tensor model_visual_transformer_resblocks_7_attn_out_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_7_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(107582848)))]; tensor model_visual_transformer_resblocks_7_attn_out_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_7_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(108762560)))]; tensor linear_29_cast_fp16 = linear(bias = model_visual_transformer_resblocks_7_attn_out_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_7_attn_out_proj_weight_to_fp16, x = attn_output_59_cast_fp16)[name = tensor("linear_29_cast_fp16")]; tensor var_830 = const()[name = tensor("op_830"), val = tensor([50, 1, 768])]; tensor attn_output_63_cast_fp16 = reshape(shape = var_830, x = linear_29_cast_fp16)[name = tensor("attn_output_63_cast_fp16")]; tensor var_832_perm_0 = const()[name = tensor("op_832_perm_0"), val = tensor([1, 0, 2])]; tensor var_832_cast_fp16 = transpose(perm = var_832_perm_0, x = attn_output_63_cast_fp16)[name = tensor("transpose_29")]; tensor input_75_cast_fp16 = add(x = input_73_cast_fp16, y = var_832_cast_fp16)[name = tensor("input_75_cast_fp16")]; tensor x_41_axes_0 = const()[name = tensor("x_41_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_7_ln_2_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_7_ln_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(108764160)))]; tensor model_visual_transformer_resblocks_7_ln_2_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_7_ln_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(108765760)))]; tensor x_41_cast_fp16 = layer_norm(axes = x_41_axes_0, beta = model_visual_transformer_resblocks_7_ln_2_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_7_ln_2_weight_to_fp16, x = input_75_cast_fp16)[name = tensor("x_41_cast_fp16")]; tensor model_visual_transformer_resblocks_7_mlp_c_fc_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_7_mlp_c_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(108767360)))]; tensor model_visual_transformer_resblocks_7_mlp_c_fc_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_7_mlp_c_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(113486016)))]; tensor linear_30_cast_fp16 = linear(bias = model_visual_transformer_resblocks_7_mlp_c_fc_bias_to_fp16, weight = model_visual_transformer_resblocks_7_mlp_c_fc_weight_to_fp16, x = x_41_cast_fp16)[name = tensor("linear_30_cast_fp16")]; tensor input_81_mode_0 = const()[name = tensor("input_81_mode_0"), val = tensor("EXACT")]; tensor input_81_cast_fp16 = gelu(mode = input_81_mode_0, x = linear_30_cast_fp16)[name = tensor("input_81_cast_fp16")]; tensor model_visual_transformer_resblocks_7_mlp_c_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_7_mlp_c_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(113492224)))]; tensor model_visual_transformer_resblocks_7_mlp_c_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_7_mlp_c_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118210880)))]; tensor linear_31_cast_fp16 = linear(bias = model_visual_transformer_resblocks_7_mlp_c_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_7_mlp_c_proj_weight_to_fp16, x = input_81_cast_fp16)[name = tensor("linear_31_cast_fp16")]; tensor input_83_cast_fp16 = add(x = input_75_cast_fp16, y = linear_31_cast_fp16)[name = tensor("input_83_cast_fp16")]; tensor x_43_axes_0 = const()[name = tensor("x_43_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_8_ln_1_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_8_ln_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118212480)))]; tensor model_visual_transformer_resblocks_8_ln_1_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_8_ln_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118214080)))]; tensor x_43_cast_fp16 = layer_norm(axes = x_43_axes_0, beta = model_visual_transformer_resblocks_8_ln_1_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_8_ln_1_weight_to_fp16, x = input_83_cast_fp16)[name = tensor("x_43_cast_fp16")]; tensor query_35_perm_0 = const()[name = tensor("query_35_perm_0"), val = tensor([1, 0, 2])]; tensor model_visual_transformer_resblocks_8_attn_in_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_8_attn_in_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118215680)))]; tensor model_visual_transformer_resblocks_8_attn_in_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_8_attn_in_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121754688)))]; tensor query_35_cast_fp16 = transpose(perm = query_35_perm_0, x = x_43_cast_fp16)[name = tensor("transpose_28")]; tensor linear_32_cast_fp16 = linear(bias = model_visual_transformer_resblocks_8_attn_in_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_8_attn_in_proj_weight_to_fp16, x = query_35_cast_fp16)[name = tensor("linear_32_cast_fp16")]; tensor concat_9 = const()[name = tensor("concat_9"), val = tensor([50, 1, 3, 768])]; tensor var_881_cast_fp16 = reshape(shape = concat_9, x = linear_32_cast_fp16)[name = tensor("op_881_cast_fp16")]; tensor var_882_axes_0 = const()[name = tensor("op_882_axes_0"), val = tensor([0])]; tensor var_882_cast_fp16 = expand_dims(axes = var_882_axes_0, x = var_881_cast_fp16)[name = tensor("op_882_cast_fp16")]; tensor var_883_perm_0 = const()[name = tensor("op_883_perm_0"), val = tensor([-2, 1, 2, 0, 4])]; tensor var_884_axes_0 = const()[name = tensor("op_884_axes_0"), val = tensor([-2])]; tensor var_883_cast_fp16 = transpose(perm = var_883_perm_0, x = var_882_cast_fp16)[name = tensor("transpose_27")]; tensor var_884_cast_fp16 = squeeze(axes = var_884_axes_0, x = var_883_cast_fp16)[name = tensor("op_884_cast_fp16")]; tensor q_49_begin_0 = const()[name = tensor("q_49_begin_0"), val = tensor([0, 0, 0, 0])]; tensor q_49_end_0 = const()[name = tensor("q_49_end_0"), val = tensor([1, 50, 1, 768])]; tensor q_49_end_mask_0 = const()[name = tensor("q_49_end_mask_0"), val = tensor([false, true, true, true])]; tensor q_49_squeeze_mask_0 = const()[name = tensor("q_49_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor q_49_cast_fp16 = slice_by_index(begin = q_49_begin_0, end = q_49_end_0, end_mask = q_49_end_mask_0, squeeze_mask = q_49_squeeze_mask_0, x = var_884_cast_fp16)[name = tensor("q_49_cast_fp16")]; tensor k_49_begin_0 = const()[name = tensor("k_49_begin_0"), val = tensor([1, 0, 0, 0])]; tensor k_49_end_0 = const()[name = tensor("k_49_end_0"), val = tensor([2, 50, 1, 768])]; tensor k_49_end_mask_0 = const()[name = tensor("k_49_end_mask_0"), val = tensor([false, true, true, true])]; tensor k_49_squeeze_mask_0 = const()[name = tensor("k_49_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor k_49_cast_fp16 = slice_by_index(begin = k_49_begin_0, end = k_49_end_0, end_mask = k_49_end_mask_0, squeeze_mask = k_49_squeeze_mask_0, x = var_884_cast_fp16)[name = tensor("k_49_cast_fp16")]; tensor v_49_begin_0 = const()[name = tensor("v_49_begin_0"), val = tensor([2, 0, 0, 0])]; tensor v_49_end_0 = const()[name = tensor("v_49_end_0"), val = tensor([3, 50, 1, 768])]; tensor v_49_end_mask_0 = const()[name = tensor("v_49_end_mask_0"), val = tensor([false, true, true, true])]; tensor v_49_squeeze_mask_0 = const()[name = tensor("v_49_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor v_49_cast_fp16 = slice_by_index(begin = v_49_begin_0, end = v_49_end_0, end_mask = v_49_end_mask_0, squeeze_mask = v_49_squeeze_mask_0, x = var_884_cast_fp16)[name = tensor("v_49_cast_fp16")]; tensor var_892 = const()[name = tensor("op_892"), val = tensor([50, 12, 64])]; tensor var_893_cast_fp16 = reshape(shape = var_892, x = q_49_cast_fp16)[name = tensor("op_893_cast_fp16")]; tensor q_51_perm_0 = const()[name = tensor("q_51_perm_0"), val = tensor([1, 0, 2])]; tensor var_899 = const()[name = tensor("op_899"), val = tensor([50, 12, 64])]; tensor var_900_cast_fp16 = reshape(shape = var_899, x = k_49_cast_fp16)[name = tensor("op_900_cast_fp16")]; tensor k_51_perm_0 = const()[name = tensor("k_51_perm_0"), val = tensor([1, 0, 2])]; tensor var_906 = const()[name = tensor("op_906"), val = tensor([50, 12, 64])]; tensor var_907_cast_fp16 = reshape(shape = var_906, x = v_49_cast_fp16)[name = tensor("op_907_cast_fp16")]; tensor v_51_perm_0 = const()[name = tensor("v_51_perm_0"), val = tensor([1, 0, 2])]; tensor var_910 = const()[name = tensor("op_910"), val = tensor([1, 12, 50, 64])]; tensor q_51_cast_fp16 = transpose(perm = q_51_perm_0, x = var_893_cast_fp16)[name = tensor("transpose_26")]; tensor q_53_cast_fp16 = reshape(shape = var_910, x = q_51_cast_fp16)[name = tensor("q_53_cast_fp16")]; tensor var_912 = const()[name = tensor("op_912"), val = tensor([1, 12, 50, 64])]; tensor k_51_cast_fp16 = transpose(perm = k_51_perm_0, x = var_900_cast_fp16)[name = tensor("transpose_25")]; tensor k_53_cast_fp16 = reshape(shape = var_912, x = k_51_cast_fp16)[name = tensor("k_53_cast_fp16")]; tensor var_914 = const()[name = tensor("op_914"), val = tensor([1, 12, 50, 64])]; tensor v_51_cast_fp16 = transpose(perm = v_51_perm_0, x = var_907_cast_fp16)[name = tensor("transpose_24")]; tensor v_53_cast_fp16 = reshape(shape = var_914, x = v_51_cast_fp16)[name = tensor("v_53_cast_fp16")]; tensor mul_17_y_0_to_fp16 = const()[name = tensor("mul_17_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor mul_17_cast_fp16 = mul(x = q_53_cast_fp16, y = mul_17_y_0_to_fp16)[name = tensor("mul_17_cast_fp16")]; tensor matmul_8_transpose_y_0 = const()[name = tensor("matmul_8_transpose_y_0"), val = tensor(true)]; tensor matmul_8_transpose_x_0 = const()[name = tensor("matmul_8_transpose_x_0"), val = tensor(false)]; tensor matmul_8_cast_fp16 = matmul(transpose_x = matmul_8_transpose_x_0, transpose_y = matmul_8_transpose_y_0, x = mul_17_cast_fp16, y = k_53_cast_fp16)[name = tensor("matmul_8_cast_fp16")]; tensor softmax_8_axis_0 = const()[name = tensor("softmax_8_axis_0"), val = tensor(-1)]; tensor softmax_8_cast_fp16 = softmax(axis = softmax_8_axis_0, x = matmul_8_cast_fp16)[name = tensor("softmax_8_cast_fp16")]; tensor attn_output_65_transpose_x_0 = const()[name = tensor("attn_output_65_transpose_x_0"), val = tensor(false)]; tensor attn_output_65_transpose_y_0 = const()[name = tensor("attn_output_65_transpose_y_0"), val = tensor(false)]; tensor attn_output_65_cast_fp16 = matmul(transpose_x = attn_output_65_transpose_x_0, transpose_y = attn_output_65_transpose_y_0, x = softmax_8_cast_fp16, y = v_53_cast_fp16)[name = tensor("attn_output_65_cast_fp16")]; tensor var_917 = const()[name = tensor("op_917"), val = tensor([2, 0, 1, 3])]; tensor var_922 = const()[name = tensor("op_922"), val = tensor([50, 768])]; tensor var_918_cast_fp16 = transpose(perm = var_917, x = attn_output_65_cast_fp16)[name = tensor("transpose_23")]; tensor attn_output_67_cast_fp16 = reshape(shape = var_922, x = var_918_cast_fp16)[name = tensor("attn_output_67_cast_fp16")]; tensor model_visual_transformer_resblocks_8_attn_out_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_8_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121759360)))]; tensor model_visual_transformer_resblocks_8_attn_out_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_8_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122939072)))]; tensor linear_33_cast_fp16 = linear(bias = model_visual_transformer_resblocks_8_attn_out_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_8_attn_out_proj_weight_to_fp16, x = attn_output_67_cast_fp16)[name = tensor("linear_33_cast_fp16")]; tensor var_926 = const()[name = tensor("op_926"), val = tensor([50, 1, 768])]; tensor attn_output_71_cast_fp16 = reshape(shape = var_926, x = linear_33_cast_fp16)[name = tensor("attn_output_71_cast_fp16")]; tensor var_928_perm_0 = const()[name = tensor("op_928_perm_0"), val = tensor([1, 0, 2])]; tensor var_928_cast_fp16 = transpose(perm = var_928_perm_0, x = attn_output_71_cast_fp16)[name = tensor("transpose_22")]; tensor input_85_cast_fp16 = add(x = input_83_cast_fp16, y = var_928_cast_fp16)[name = tensor("input_85_cast_fp16")]; tensor x_45_axes_0 = const()[name = tensor("x_45_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_8_ln_2_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_8_ln_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122940672)))]; tensor model_visual_transformer_resblocks_8_ln_2_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_8_ln_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122942272)))]; tensor x_45_cast_fp16 = layer_norm(axes = x_45_axes_0, beta = model_visual_transformer_resblocks_8_ln_2_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_8_ln_2_weight_to_fp16, x = input_85_cast_fp16)[name = tensor("x_45_cast_fp16")]; tensor model_visual_transformer_resblocks_8_mlp_c_fc_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_8_mlp_c_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122943872)))]; tensor model_visual_transformer_resblocks_8_mlp_c_fc_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_8_mlp_c_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127662528)))]; tensor linear_34_cast_fp16 = linear(bias = model_visual_transformer_resblocks_8_mlp_c_fc_bias_to_fp16, weight = model_visual_transformer_resblocks_8_mlp_c_fc_weight_to_fp16, x = x_45_cast_fp16)[name = tensor("linear_34_cast_fp16")]; tensor input_91_mode_0 = const()[name = tensor("input_91_mode_0"), val = tensor("EXACT")]; tensor input_91_cast_fp16 = gelu(mode = input_91_mode_0, x = linear_34_cast_fp16)[name = tensor("input_91_cast_fp16")]; tensor model_visual_transformer_resblocks_8_mlp_c_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_8_mlp_c_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127668736)))]; tensor model_visual_transformer_resblocks_8_mlp_c_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_8_mlp_c_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132387392)))]; tensor linear_35_cast_fp16 = linear(bias = model_visual_transformer_resblocks_8_mlp_c_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_8_mlp_c_proj_weight_to_fp16, x = input_91_cast_fp16)[name = tensor("linear_35_cast_fp16")]; tensor input_93_cast_fp16 = add(x = input_85_cast_fp16, y = linear_35_cast_fp16)[name = tensor("input_93_cast_fp16")]; tensor x_47_axes_0 = const()[name = tensor("x_47_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_9_ln_1_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_9_ln_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132388992)))]; tensor model_visual_transformer_resblocks_9_ln_1_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_9_ln_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132390592)))]; tensor x_47_cast_fp16 = layer_norm(axes = x_47_axes_0, beta = model_visual_transformer_resblocks_9_ln_1_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_9_ln_1_weight_to_fp16, x = input_93_cast_fp16)[name = tensor("x_47_cast_fp16")]; tensor query_39_perm_0 = const()[name = tensor("query_39_perm_0"), val = tensor([1, 0, 2])]; tensor model_visual_transformer_resblocks_9_attn_in_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_9_attn_in_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132392192)))]; tensor model_visual_transformer_resblocks_9_attn_in_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_9_attn_in_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135931200)))]; tensor query_39_cast_fp16 = transpose(perm = query_39_perm_0, x = x_47_cast_fp16)[name = tensor("transpose_21")]; tensor linear_36_cast_fp16 = linear(bias = model_visual_transformer_resblocks_9_attn_in_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_9_attn_in_proj_weight_to_fp16, x = query_39_cast_fp16)[name = tensor("linear_36_cast_fp16")]; tensor concat_10 = const()[name = tensor("concat_10"), val = tensor([50, 1, 3, 768])]; tensor var_977_cast_fp16 = reshape(shape = concat_10, x = linear_36_cast_fp16)[name = tensor("op_977_cast_fp16")]; tensor var_978_axes_0 = const()[name = tensor("op_978_axes_0"), val = tensor([0])]; tensor var_978_cast_fp16 = expand_dims(axes = var_978_axes_0, x = var_977_cast_fp16)[name = tensor("op_978_cast_fp16")]; tensor var_979_perm_0 = const()[name = tensor("op_979_perm_0"), val = tensor([-2, 1, 2, 0, 4])]; tensor var_980_axes_0 = const()[name = tensor("op_980_axes_0"), val = tensor([-2])]; tensor var_979_cast_fp16 = transpose(perm = var_979_perm_0, x = var_978_cast_fp16)[name = tensor("transpose_20")]; tensor var_980_cast_fp16 = squeeze(axes = var_980_axes_0, x = var_979_cast_fp16)[name = tensor("op_980_cast_fp16")]; tensor q_55_begin_0 = const()[name = tensor("q_55_begin_0"), val = tensor([0, 0, 0, 0])]; tensor q_55_end_0 = const()[name = tensor("q_55_end_0"), val = tensor([1, 50, 1, 768])]; tensor q_55_end_mask_0 = const()[name = tensor("q_55_end_mask_0"), val = tensor([false, true, true, true])]; tensor q_55_squeeze_mask_0 = const()[name = tensor("q_55_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor q_55_cast_fp16 = slice_by_index(begin = q_55_begin_0, end = q_55_end_0, end_mask = q_55_end_mask_0, squeeze_mask = q_55_squeeze_mask_0, x = var_980_cast_fp16)[name = tensor("q_55_cast_fp16")]; tensor k_55_begin_0 = const()[name = tensor("k_55_begin_0"), val = tensor([1, 0, 0, 0])]; tensor k_55_end_0 = const()[name = tensor("k_55_end_0"), val = tensor([2, 50, 1, 768])]; tensor k_55_end_mask_0 = const()[name = tensor("k_55_end_mask_0"), val = tensor([false, true, true, true])]; tensor k_55_squeeze_mask_0 = const()[name = tensor("k_55_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor k_55_cast_fp16 = slice_by_index(begin = k_55_begin_0, end = k_55_end_0, end_mask = k_55_end_mask_0, squeeze_mask = k_55_squeeze_mask_0, x = var_980_cast_fp16)[name = tensor("k_55_cast_fp16")]; tensor v_55_begin_0 = const()[name = tensor("v_55_begin_0"), val = tensor([2, 0, 0, 0])]; tensor v_55_end_0 = const()[name = tensor("v_55_end_0"), val = tensor([3, 50, 1, 768])]; tensor v_55_end_mask_0 = const()[name = tensor("v_55_end_mask_0"), val = tensor([false, true, true, true])]; tensor v_55_squeeze_mask_0 = const()[name = tensor("v_55_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor v_55_cast_fp16 = slice_by_index(begin = v_55_begin_0, end = v_55_end_0, end_mask = v_55_end_mask_0, squeeze_mask = v_55_squeeze_mask_0, x = var_980_cast_fp16)[name = tensor("v_55_cast_fp16")]; tensor var_988 = const()[name = tensor("op_988"), val = tensor([50, 12, 64])]; tensor var_989_cast_fp16 = reshape(shape = var_988, x = q_55_cast_fp16)[name = tensor("op_989_cast_fp16")]; tensor q_57_perm_0 = const()[name = tensor("q_57_perm_0"), val = tensor([1, 0, 2])]; tensor var_995 = const()[name = tensor("op_995"), val = tensor([50, 12, 64])]; tensor var_996_cast_fp16 = reshape(shape = var_995, x = k_55_cast_fp16)[name = tensor("op_996_cast_fp16")]; tensor k_57_perm_0 = const()[name = tensor("k_57_perm_0"), val = tensor([1, 0, 2])]; tensor var_1002 = const()[name = tensor("op_1002"), val = tensor([50, 12, 64])]; tensor var_1003_cast_fp16 = reshape(shape = var_1002, x = v_55_cast_fp16)[name = tensor("op_1003_cast_fp16")]; tensor v_57_perm_0 = const()[name = tensor("v_57_perm_0"), val = tensor([1, 0, 2])]; tensor var_1006 = const()[name = tensor("op_1006"), val = tensor([1, 12, 50, 64])]; tensor q_57_cast_fp16 = transpose(perm = q_57_perm_0, x = var_989_cast_fp16)[name = tensor("transpose_19")]; tensor q_59_cast_fp16 = reshape(shape = var_1006, x = q_57_cast_fp16)[name = tensor("q_59_cast_fp16")]; tensor var_1008 = const()[name = tensor("op_1008"), val = tensor([1, 12, 50, 64])]; tensor k_57_cast_fp16 = transpose(perm = k_57_perm_0, x = var_996_cast_fp16)[name = tensor("transpose_18")]; tensor k_59_cast_fp16 = reshape(shape = var_1008, x = k_57_cast_fp16)[name = tensor("k_59_cast_fp16")]; tensor var_1010 = const()[name = tensor("op_1010"), val = tensor([1, 12, 50, 64])]; tensor v_57_cast_fp16 = transpose(perm = v_57_perm_0, x = var_1003_cast_fp16)[name = tensor("transpose_17")]; tensor v_59_cast_fp16 = reshape(shape = var_1010, x = v_57_cast_fp16)[name = tensor("v_59_cast_fp16")]; tensor mul_19_y_0_to_fp16 = const()[name = tensor("mul_19_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor mul_19_cast_fp16 = mul(x = q_59_cast_fp16, y = mul_19_y_0_to_fp16)[name = tensor("mul_19_cast_fp16")]; tensor matmul_9_transpose_y_0 = const()[name = tensor("matmul_9_transpose_y_0"), val = tensor(true)]; tensor matmul_9_transpose_x_0 = const()[name = tensor("matmul_9_transpose_x_0"), val = tensor(false)]; tensor matmul_9_cast_fp16 = matmul(transpose_x = matmul_9_transpose_x_0, transpose_y = matmul_9_transpose_y_0, x = mul_19_cast_fp16, y = k_59_cast_fp16)[name = tensor("matmul_9_cast_fp16")]; tensor softmax_9_axis_0 = const()[name = tensor("softmax_9_axis_0"), val = tensor(-1)]; tensor softmax_9_cast_fp16 = softmax(axis = softmax_9_axis_0, x = matmul_9_cast_fp16)[name = tensor("softmax_9_cast_fp16")]; tensor attn_output_73_transpose_x_0 = const()[name = tensor("attn_output_73_transpose_x_0"), val = tensor(false)]; tensor attn_output_73_transpose_y_0 = const()[name = tensor("attn_output_73_transpose_y_0"), val = tensor(false)]; tensor attn_output_73_cast_fp16 = matmul(transpose_x = attn_output_73_transpose_x_0, transpose_y = attn_output_73_transpose_y_0, x = softmax_9_cast_fp16, y = v_59_cast_fp16)[name = tensor("attn_output_73_cast_fp16")]; tensor var_1013 = const()[name = tensor("op_1013"), val = tensor([2, 0, 1, 3])]; tensor var_1018 = const()[name = tensor("op_1018"), val = tensor([50, 768])]; tensor var_1014_cast_fp16 = transpose(perm = var_1013, x = attn_output_73_cast_fp16)[name = tensor("transpose_16")]; tensor attn_output_75_cast_fp16 = reshape(shape = var_1018, x = var_1014_cast_fp16)[name = tensor("attn_output_75_cast_fp16")]; tensor model_visual_transformer_resblocks_9_attn_out_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_9_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135935872)))]; tensor model_visual_transformer_resblocks_9_attn_out_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_9_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(137115584)))]; tensor linear_37_cast_fp16 = linear(bias = model_visual_transformer_resblocks_9_attn_out_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_9_attn_out_proj_weight_to_fp16, x = attn_output_75_cast_fp16)[name = tensor("linear_37_cast_fp16")]; tensor var_1022 = const()[name = tensor("op_1022"), val = tensor([50, 1, 768])]; tensor attn_output_79_cast_fp16 = reshape(shape = var_1022, x = linear_37_cast_fp16)[name = tensor("attn_output_79_cast_fp16")]; tensor var_1024_perm_0 = const()[name = tensor("op_1024_perm_0"), val = tensor([1, 0, 2])]; tensor var_1024_cast_fp16 = transpose(perm = var_1024_perm_0, x = attn_output_79_cast_fp16)[name = tensor("transpose_15")]; tensor input_95_cast_fp16 = add(x = input_93_cast_fp16, y = var_1024_cast_fp16)[name = tensor("input_95_cast_fp16")]; tensor x_49_axes_0 = const()[name = tensor("x_49_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_9_ln_2_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_9_ln_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(137117184)))]; tensor model_visual_transformer_resblocks_9_ln_2_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_9_ln_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(137118784)))]; tensor x_49_cast_fp16 = layer_norm(axes = x_49_axes_0, beta = model_visual_transformer_resblocks_9_ln_2_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_9_ln_2_weight_to_fp16, x = input_95_cast_fp16)[name = tensor("x_49_cast_fp16")]; tensor model_visual_transformer_resblocks_9_mlp_c_fc_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_9_mlp_c_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(137120384)))]; tensor model_visual_transformer_resblocks_9_mlp_c_fc_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_9_mlp_c_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141839040)))]; tensor linear_38_cast_fp16 = linear(bias = model_visual_transformer_resblocks_9_mlp_c_fc_bias_to_fp16, weight = model_visual_transformer_resblocks_9_mlp_c_fc_weight_to_fp16, x = x_49_cast_fp16)[name = tensor("linear_38_cast_fp16")]; tensor input_101_mode_0 = const()[name = tensor("input_101_mode_0"), val = tensor("EXACT")]; tensor input_101_cast_fp16 = gelu(mode = input_101_mode_0, x = linear_38_cast_fp16)[name = tensor("input_101_cast_fp16")]; tensor model_visual_transformer_resblocks_9_mlp_c_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_9_mlp_c_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141845248)))]; tensor model_visual_transformer_resblocks_9_mlp_c_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_9_mlp_c_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146563904)))]; tensor linear_39_cast_fp16 = linear(bias = model_visual_transformer_resblocks_9_mlp_c_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_9_mlp_c_proj_weight_to_fp16, x = input_101_cast_fp16)[name = tensor("linear_39_cast_fp16")]; tensor input_103_cast_fp16 = add(x = input_95_cast_fp16, y = linear_39_cast_fp16)[name = tensor("input_103_cast_fp16")]; tensor x_51_axes_0 = const()[name = tensor("x_51_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_10_ln_1_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_10_ln_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146565504)))]; tensor model_visual_transformer_resblocks_10_ln_1_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_10_ln_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146567104)))]; tensor x_51_cast_fp16 = layer_norm(axes = x_51_axes_0, beta = model_visual_transformer_resblocks_10_ln_1_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_10_ln_1_weight_to_fp16, x = input_103_cast_fp16)[name = tensor("x_51_cast_fp16")]; tensor query_43_perm_0 = const()[name = tensor("query_43_perm_0"), val = tensor([1, 0, 2])]; tensor model_visual_transformer_resblocks_10_attn_in_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_10_attn_in_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146568704)))]; tensor model_visual_transformer_resblocks_10_attn_in_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_10_attn_in_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(150107712)))]; tensor query_43_cast_fp16 = transpose(perm = query_43_perm_0, x = x_51_cast_fp16)[name = tensor("transpose_14")]; tensor linear_40_cast_fp16 = linear(bias = model_visual_transformer_resblocks_10_attn_in_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_10_attn_in_proj_weight_to_fp16, x = query_43_cast_fp16)[name = tensor("linear_40_cast_fp16")]; tensor concat_11 = const()[name = tensor("concat_11"), val = tensor([50, 1, 3, 768])]; tensor var_1073_cast_fp16 = reshape(shape = concat_11, x = linear_40_cast_fp16)[name = tensor("op_1073_cast_fp16")]; tensor var_1074_axes_0 = const()[name = tensor("op_1074_axes_0"), val = tensor([0])]; tensor var_1074_cast_fp16 = expand_dims(axes = var_1074_axes_0, x = var_1073_cast_fp16)[name = tensor("op_1074_cast_fp16")]; tensor var_1075_perm_0 = const()[name = tensor("op_1075_perm_0"), val = tensor([-2, 1, 2, 0, 4])]; tensor var_1076_axes_0 = const()[name = tensor("op_1076_axes_0"), val = tensor([-2])]; tensor var_1075_cast_fp16 = transpose(perm = var_1075_perm_0, x = var_1074_cast_fp16)[name = tensor("transpose_13")]; tensor var_1076_cast_fp16 = squeeze(axes = var_1076_axes_0, x = var_1075_cast_fp16)[name = tensor("op_1076_cast_fp16")]; tensor q_61_begin_0 = const()[name = tensor("q_61_begin_0"), val = tensor([0, 0, 0, 0])]; tensor q_61_end_0 = const()[name = tensor("q_61_end_0"), val = tensor([1, 50, 1, 768])]; tensor q_61_end_mask_0 = const()[name = tensor("q_61_end_mask_0"), val = tensor([false, true, true, true])]; tensor q_61_squeeze_mask_0 = const()[name = tensor("q_61_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor q_61_cast_fp16 = slice_by_index(begin = q_61_begin_0, end = q_61_end_0, end_mask = q_61_end_mask_0, squeeze_mask = q_61_squeeze_mask_0, x = var_1076_cast_fp16)[name = tensor("q_61_cast_fp16")]; tensor k_61_begin_0 = const()[name = tensor("k_61_begin_0"), val = tensor([1, 0, 0, 0])]; tensor k_61_end_0 = const()[name = tensor("k_61_end_0"), val = tensor([2, 50, 1, 768])]; tensor k_61_end_mask_0 = const()[name = tensor("k_61_end_mask_0"), val = tensor([false, true, true, true])]; tensor k_61_squeeze_mask_0 = const()[name = tensor("k_61_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor k_61_cast_fp16 = slice_by_index(begin = k_61_begin_0, end = k_61_end_0, end_mask = k_61_end_mask_0, squeeze_mask = k_61_squeeze_mask_0, x = var_1076_cast_fp16)[name = tensor("k_61_cast_fp16")]; tensor v_61_begin_0 = const()[name = tensor("v_61_begin_0"), val = tensor([2, 0, 0, 0])]; tensor v_61_end_0 = const()[name = tensor("v_61_end_0"), val = tensor([3, 50, 1, 768])]; tensor v_61_end_mask_0 = const()[name = tensor("v_61_end_mask_0"), val = tensor([false, true, true, true])]; tensor v_61_squeeze_mask_0 = const()[name = tensor("v_61_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor v_61_cast_fp16 = slice_by_index(begin = v_61_begin_0, end = v_61_end_0, end_mask = v_61_end_mask_0, squeeze_mask = v_61_squeeze_mask_0, x = var_1076_cast_fp16)[name = tensor("v_61_cast_fp16")]; tensor var_1084 = const()[name = tensor("op_1084"), val = tensor([50, 12, 64])]; tensor var_1085_cast_fp16 = reshape(shape = var_1084, x = q_61_cast_fp16)[name = tensor("op_1085_cast_fp16")]; tensor q_63_perm_0 = const()[name = tensor("q_63_perm_0"), val = tensor([1, 0, 2])]; tensor var_1091 = const()[name = tensor("op_1091"), val = tensor([50, 12, 64])]; tensor var_1092_cast_fp16 = reshape(shape = var_1091, x = k_61_cast_fp16)[name = tensor("op_1092_cast_fp16")]; tensor k_63_perm_0 = const()[name = tensor("k_63_perm_0"), val = tensor([1, 0, 2])]; tensor var_1098 = const()[name = tensor("op_1098"), val = tensor([50, 12, 64])]; tensor var_1099_cast_fp16 = reshape(shape = var_1098, x = v_61_cast_fp16)[name = tensor("op_1099_cast_fp16")]; tensor v_63_perm_0 = const()[name = tensor("v_63_perm_0"), val = tensor([1, 0, 2])]; tensor var_1102 = const()[name = tensor("op_1102"), val = tensor([1, 12, 50, 64])]; tensor q_63_cast_fp16 = transpose(perm = q_63_perm_0, x = var_1085_cast_fp16)[name = tensor("transpose_12")]; tensor q_65_cast_fp16 = reshape(shape = var_1102, x = q_63_cast_fp16)[name = tensor("q_65_cast_fp16")]; tensor var_1104 = const()[name = tensor("op_1104"), val = tensor([1, 12, 50, 64])]; tensor k_63_cast_fp16 = transpose(perm = k_63_perm_0, x = var_1092_cast_fp16)[name = tensor("transpose_11")]; tensor k_65_cast_fp16 = reshape(shape = var_1104, x = k_63_cast_fp16)[name = tensor("k_65_cast_fp16")]; tensor var_1106 = const()[name = tensor("op_1106"), val = tensor([1, 12, 50, 64])]; tensor v_63_cast_fp16 = transpose(perm = v_63_perm_0, x = var_1099_cast_fp16)[name = tensor("transpose_10")]; tensor v_65_cast_fp16 = reshape(shape = var_1106, x = v_63_cast_fp16)[name = tensor("v_65_cast_fp16")]; tensor mul_21_y_0_to_fp16 = const()[name = tensor("mul_21_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor mul_21_cast_fp16 = mul(x = q_65_cast_fp16, y = mul_21_y_0_to_fp16)[name = tensor("mul_21_cast_fp16")]; tensor matmul_10_transpose_y_0 = const()[name = tensor("matmul_10_transpose_y_0"), val = tensor(true)]; tensor matmul_10_transpose_x_0 = const()[name = tensor("matmul_10_transpose_x_0"), val = tensor(false)]; tensor matmul_10_cast_fp16 = matmul(transpose_x = matmul_10_transpose_x_0, transpose_y = matmul_10_transpose_y_0, x = mul_21_cast_fp16, y = k_65_cast_fp16)[name = tensor("matmul_10_cast_fp16")]; tensor softmax_10_axis_0 = const()[name = tensor("softmax_10_axis_0"), val = tensor(-1)]; tensor softmax_10_cast_fp16 = softmax(axis = softmax_10_axis_0, x = matmul_10_cast_fp16)[name = tensor("softmax_10_cast_fp16")]; tensor attn_output_81_transpose_x_0 = const()[name = tensor("attn_output_81_transpose_x_0"), val = tensor(false)]; tensor attn_output_81_transpose_y_0 = const()[name = tensor("attn_output_81_transpose_y_0"), val = tensor(false)]; tensor attn_output_81_cast_fp16 = matmul(transpose_x = attn_output_81_transpose_x_0, transpose_y = attn_output_81_transpose_y_0, x = softmax_10_cast_fp16, y = v_65_cast_fp16)[name = tensor("attn_output_81_cast_fp16")]; tensor var_1109 = const()[name = tensor("op_1109"), val = tensor([2, 0, 1, 3])]; tensor var_1114 = const()[name = tensor("op_1114"), val = tensor([50, 768])]; tensor var_1110_cast_fp16 = transpose(perm = var_1109, x = attn_output_81_cast_fp16)[name = tensor("transpose_9")]; tensor attn_output_83_cast_fp16 = reshape(shape = var_1114, x = var_1110_cast_fp16)[name = tensor("attn_output_83_cast_fp16")]; tensor model_visual_transformer_resblocks_10_attn_out_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_10_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(150112384)))]; tensor model_visual_transformer_resblocks_10_attn_out_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_10_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151292096)))]; tensor linear_41_cast_fp16 = linear(bias = model_visual_transformer_resblocks_10_attn_out_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_10_attn_out_proj_weight_to_fp16, x = attn_output_83_cast_fp16)[name = tensor("linear_41_cast_fp16")]; tensor var_1118 = const()[name = tensor("op_1118"), val = tensor([50, 1, 768])]; tensor attn_output_87_cast_fp16 = reshape(shape = var_1118, x = linear_41_cast_fp16)[name = tensor("attn_output_87_cast_fp16")]; tensor var_1120_perm_0 = const()[name = tensor("op_1120_perm_0"), val = tensor([1, 0, 2])]; tensor var_1120_cast_fp16 = transpose(perm = var_1120_perm_0, x = attn_output_87_cast_fp16)[name = tensor("transpose_8")]; tensor input_105_cast_fp16 = add(x = input_103_cast_fp16, y = var_1120_cast_fp16)[name = tensor("input_105_cast_fp16")]; tensor x_53_axes_0 = const()[name = tensor("x_53_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_10_ln_2_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_10_ln_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151293696)))]; tensor model_visual_transformer_resblocks_10_ln_2_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_10_ln_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151295296)))]; tensor x_53_cast_fp16 = layer_norm(axes = x_53_axes_0, beta = model_visual_transformer_resblocks_10_ln_2_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_10_ln_2_weight_to_fp16, x = input_105_cast_fp16)[name = tensor("x_53_cast_fp16")]; tensor model_visual_transformer_resblocks_10_mlp_c_fc_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_10_mlp_c_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151296896)))]; tensor model_visual_transformer_resblocks_10_mlp_c_fc_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_10_mlp_c_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(156015552)))]; tensor linear_42_cast_fp16 = linear(bias = model_visual_transformer_resblocks_10_mlp_c_fc_bias_to_fp16, weight = model_visual_transformer_resblocks_10_mlp_c_fc_weight_to_fp16, x = x_53_cast_fp16)[name = tensor("linear_42_cast_fp16")]; tensor input_111_mode_0 = const()[name = tensor("input_111_mode_0"), val = tensor("EXACT")]; tensor input_111_cast_fp16 = gelu(mode = input_111_mode_0, x = linear_42_cast_fp16)[name = tensor("input_111_cast_fp16")]; tensor model_visual_transformer_resblocks_10_mlp_c_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_10_mlp_c_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(156021760)))]; tensor model_visual_transformer_resblocks_10_mlp_c_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_10_mlp_c_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160740416)))]; tensor linear_43_cast_fp16 = linear(bias = model_visual_transformer_resblocks_10_mlp_c_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_10_mlp_c_proj_weight_to_fp16, x = input_111_cast_fp16)[name = tensor("linear_43_cast_fp16")]; tensor input_113_cast_fp16 = add(x = input_105_cast_fp16, y = linear_43_cast_fp16)[name = tensor("input_113_cast_fp16")]; tensor x_55_axes_0 = const()[name = tensor("x_55_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_11_ln_1_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_11_ln_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160742016)))]; tensor model_visual_transformer_resblocks_11_ln_1_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_11_ln_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160743616)))]; tensor x_55_cast_fp16 = layer_norm(axes = x_55_axes_0, beta = model_visual_transformer_resblocks_11_ln_1_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_11_ln_1_weight_to_fp16, x = input_113_cast_fp16)[name = tensor("x_55_cast_fp16")]; tensor query_perm_0 = const()[name = tensor("query_perm_0"), val = tensor([1, 0, 2])]; tensor model_visual_transformer_resblocks_11_attn_in_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_11_attn_in_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160745216)))]; tensor model_visual_transformer_resblocks_11_attn_in_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_11_attn_in_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164284224)))]; tensor query_cast_fp16 = transpose(perm = query_perm_0, x = x_55_cast_fp16)[name = tensor("transpose_7")]; tensor linear_44_cast_fp16 = linear(bias = model_visual_transformer_resblocks_11_attn_in_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_11_attn_in_proj_weight_to_fp16, x = query_cast_fp16)[name = tensor("linear_44_cast_fp16")]; tensor concat_12 = const()[name = tensor("concat_12"), val = tensor([50, 1, 3, 768])]; tensor var_1169_cast_fp16 = reshape(shape = concat_12, x = linear_44_cast_fp16)[name = tensor("op_1169_cast_fp16")]; tensor var_1170_axes_0 = const()[name = tensor("op_1170_axes_0"), val = tensor([0])]; tensor var_1170_cast_fp16 = expand_dims(axes = var_1170_axes_0, x = var_1169_cast_fp16)[name = tensor("op_1170_cast_fp16")]; tensor var_1171_perm_0 = const()[name = tensor("op_1171_perm_0"), val = tensor([-2, 1, 2, 0, 4])]; tensor var_1172_axes_0 = const()[name = tensor("op_1172_axes_0"), val = tensor([-2])]; tensor var_1171_cast_fp16 = transpose(perm = var_1171_perm_0, x = var_1170_cast_fp16)[name = tensor("transpose_6")]; tensor var_1172_cast_fp16 = squeeze(axes = var_1172_axes_0, x = var_1171_cast_fp16)[name = tensor("op_1172_cast_fp16")]; tensor q_67_begin_0 = const()[name = tensor("q_67_begin_0"), val = tensor([0, 0, 0, 0])]; tensor q_67_end_0 = const()[name = tensor("q_67_end_0"), val = tensor([1, 50, 1, 768])]; tensor q_67_end_mask_0 = const()[name = tensor("q_67_end_mask_0"), val = tensor([false, true, true, true])]; tensor q_67_squeeze_mask_0 = const()[name = tensor("q_67_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor q_67_cast_fp16 = slice_by_index(begin = q_67_begin_0, end = q_67_end_0, end_mask = q_67_end_mask_0, squeeze_mask = q_67_squeeze_mask_0, x = var_1172_cast_fp16)[name = tensor("q_67_cast_fp16")]; tensor k_67_begin_0 = const()[name = tensor("k_67_begin_0"), val = tensor([1, 0, 0, 0])]; tensor k_67_end_0 = const()[name = tensor("k_67_end_0"), val = tensor([2, 50, 1, 768])]; tensor k_67_end_mask_0 = const()[name = tensor("k_67_end_mask_0"), val = tensor([false, true, true, true])]; tensor k_67_squeeze_mask_0 = const()[name = tensor("k_67_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor k_67_cast_fp16 = slice_by_index(begin = k_67_begin_0, end = k_67_end_0, end_mask = k_67_end_mask_0, squeeze_mask = k_67_squeeze_mask_0, x = var_1172_cast_fp16)[name = tensor("k_67_cast_fp16")]; tensor v_67_begin_0 = const()[name = tensor("v_67_begin_0"), val = tensor([2, 0, 0, 0])]; tensor v_67_end_0 = const()[name = tensor("v_67_end_0"), val = tensor([3, 50, 1, 768])]; tensor v_67_end_mask_0 = const()[name = tensor("v_67_end_mask_0"), val = tensor([false, true, true, true])]; tensor v_67_squeeze_mask_0 = const()[name = tensor("v_67_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor v_67_cast_fp16 = slice_by_index(begin = v_67_begin_0, end = v_67_end_0, end_mask = v_67_end_mask_0, squeeze_mask = v_67_squeeze_mask_0, x = var_1172_cast_fp16)[name = tensor("v_67_cast_fp16")]; tensor var_1180 = const()[name = tensor("op_1180"), val = tensor([50, 12, 64])]; tensor var_1181_cast_fp16 = reshape(shape = var_1180, x = q_67_cast_fp16)[name = tensor("op_1181_cast_fp16")]; tensor q_69_perm_0 = const()[name = tensor("q_69_perm_0"), val = tensor([1, 0, 2])]; tensor var_1187 = const()[name = tensor("op_1187"), val = tensor([50, 12, 64])]; tensor var_1188_cast_fp16 = reshape(shape = var_1187, x = k_67_cast_fp16)[name = tensor("op_1188_cast_fp16")]; tensor k_69_perm_0 = const()[name = tensor("k_69_perm_0"), val = tensor([1, 0, 2])]; tensor var_1194 = const()[name = tensor("op_1194"), val = tensor([50, 12, 64])]; tensor var_1195_cast_fp16 = reshape(shape = var_1194, x = v_67_cast_fp16)[name = tensor("op_1195_cast_fp16")]; tensor v_69_perm_0 = const()[name = tensor("v_69_perm_0"), val = tensor([1, 0, 2])]; tensor var_1198 = const()[name = tensor("op_1198"), val = tensor([1, 12, 50, 64])]; tensor q_69_cast_fp16 = transpose(perm = q_69_perm_0, x = var_1181_cast_fp16)[name = tensor("transpose_5")]; tensor q_cast_fp16 = reshape(shape = var_1198, x = q_69_cast_fp16)[name = tensor("q_cast_fp16")]; tensor var_1200 = const()[name = tensor("op_1200"), val = tensor([1, 12, 50, 64])]; tensor k_69_cast_fp16 = transpose(perm = k_69_perm_0, x = var_1188_cast_fp16)[name = tensor("transpose_4")]; tensor k_cast_fp16 = reshape(shape = var_1200, x = k_69_cast_fp16)[name = tensor("k_cast_fp16")]; tensor var_1202 = const()[name = tensor("op_1202"), val = tensor([1, 12, 50, 64])]; tensor v_69_cast_fp16 = transpose(perm = v_69_perm_0, x = var_1195_cast_fp16)[name = tensor("transpose_3")]; tensor v_cast_fp16 = reshape(shape = var_1202, x = v_69_cast_fp16)[name = tensor("v_cast_fp16")]; tensor mul_23_y_0_to_fp16 = const()[name = tensor("mul_23_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor mul_23_cast_fp16 = mul(x = q_cast_fp16, y = mul_23_y_0_to_fp16)[name = tensor("mul_23_cast_fp16")]; tensor matmul_11_transpose_y_0 = const()[name = tensor("matmul_11_transpose_y_0"), val = tensor(true)]; tensor matmul_11_transpose_x_0 = const()[name = tensor("matmul_11_transpose_x_0"), val = tensor(false)]; tensor matmul_11_cast_fp16 = matmul(transpose_x = matmul_11_transpose_x_0, transpose_y = matmul_11_transpose_y_0, x = mul_23_cast_fp16, y = k_cast_fp16)[name = tensor("matmul_11_cast_fp16")]; tensor softmax_11_axis_0 = const()[name = tensor("softmax_11_axis_0"), val = tensor(-1)]; tensor softmax_11_cast_fp16 = softmax(axis = softmax_11_axis_0, x = matmul_11_cast_fp16)[name = tensor("softmax_11_cast_fp16")]; tensor attn_output_89_transpose_x_0 = const()[name = tensor("attn_output_89_transpose_x_0"), val = tensor(false)]; tensor attn_output_89_transpose_y_0 = const()[name = tensor("attn_output_89_transpose_y_0"), val = tensor(false)]; tensor attn_output_89_cast_fp16 = matmul(transpose_x = attn_output_89_transpose_x_0, transpose_y = attn_output_89_transpose_y_0, x = softmax_11_cast_fp16, y = v_cast_fp16)[name = tensor("attn_output_89_cast_fp16")]; tensor var_1205 = const()[name = tensor("op_1205"), val = tensor([2, 0, 1, 3])]; tensor var_1210 = const()[name = tensor("op_1210"), val = tensor([50, 768])]; tensor var_1206_cast_fp16 = transpose(perm = var_1205, x = attn_output_89_cast_fp16)[name = tensor("transpose_2")]; tensor attn_output_91_cast_fp16 = reshape(shape = var_1210, x = var_1206_cast_fp16)[name = tensor("attn_output_91_cast_fp16")]; tensor model_visual_transformer_resblocks_11_attn_out_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_11_attn_out_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164288896)))]; tensor model_visual_transformer_resblocks_11_attn_out_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_11_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165468608)))]; tensor linear_45_cast_fp16 = linear(bias = model_visual_transformer_resblocks_11_attn_out_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_11_attn_out_proj_weight_to_fp16, x = attn_output_91_cast_fp16)[name = tensor("linear_45_cast_fp16")]; tensor var_1214 = const()[name = tensor("op_1214"), val = tensor([50, 1, 768])]; tensor attn_output_cast_fp16 = reshape(shape = var_1214, x = linear_45_cast_fp16)[name = tensor("attn_output_cast_fp16")]; tensor var_1216_perm_0 = const()[name = tensor("op_1216_perm_0"), val = tensor([1, 0, 2])]; tensor var_1216_cast_fp16 = transpose(perm = var_1216_perm_0, x = attn_output_cast_fp16)[name = tensor("transpose_1")]; tensor input_115_cast_fp16 = add(x = input_113_cast_fp16, y = var_1216_cast_fp16)[name = tensor("input_115_cast_fp16")]; tensor x_57_axes_0 = const()[name = tensor("x_57_axes_0"), val = tensor([-1])]; tensor model_visual_transformer_resblocks_11_ln_2_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_11_ln_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165470208)))]; tensor model_visual_transformer_resblocks_11_ln_2_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_11_ln_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165471808)))]; tensor x_57_cast_fp16 = layer_norm(axes = x_57_axes_0, beta = model_visual_transformer_resblocks_11_ln_2_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_transformer_resblocks_11_ln_2_weight_to_fp16, x = input_115_cast_fp16)[name = tensor("x_57_cast_fp16")]; tensor model_visual_transformer_resblocks_11_mlp_c_fc_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_11_mlp_c_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165473408)))]; tensor model_visual_transformer_resblocks_11_mlp_c_fc_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_11_mlp_c_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(170192064)))]; tensor linear_46_cast_fp16 = linear(bias = model_visual_transformer_resblocks_11_mlp_c_fc_bias_to_fp16, weight = model_visual_transformer_resblocks_11_mlp_c_fc_weight_to_fp16, x = x_57_cast_fp16)[name = tensor("linear_46_cast_fp16")]; tensor input_121_mode_0 = const()[name = tensor("input_121_mode_0"), val = tensor("EXACT")]; tensor input_121_cast_fp16 = gelu(mode = input_121_mode_0, x = linear_46_cast_fp16)[name = tensor("input_121_cast_fp16")]; tensor model_visual_transformer_resblocks_11_mlp_c_proj_weight_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_11_mlp_c_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(170198272)))]; tensor model_visual_transformer_resblocks_11_mlp_c_proj_bias_to_fp16 = const()[name = tensor("model_visual_transformer_resblocks_11_mlp_c_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(174916928)))]; tensor linear_47_cast_fp16 = linear(bias = model_visual_transformer_resblocks_11_mlp_c_proj_bias_to_fp16, weight = model_visual_transformer_resblocks_11_mlp_c_proj_weight_to_fp16, x = input_121_cast_fp16)[name = tensor("linear_47_cast_fp16")]; tensor input_cast_fp16 = add(x = input_115_cast_fp16, y = linear_47_cast_fp16)[name = tensor("input_cast_fp16")]; tensor x_59_axes_0 = const()[name = tensor("x_59_axes_0"), val = tensor([-1])]; tensor model_visual_ln_post_weight_to_fp16 = const()[name = tensor("model_visual_ln_post_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(174918528)))]; tensor model_visual_ln_post_bias_to_fp16 = const()[name = tensor("model_visual_ln_post_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(174920128)))]; tensor x_59_cast_fp16 = layer_norm(axes = x_59_axes_0, beta = model_visual_ln_post_bias_to_fp16, epsilon = var_13_to_fp16, gamma = model_visual_ln_post_weight_to_fp16, x = input_cast_fp16)[name = tensor("x_59_cast_fp16")]; tensor pooled_begin_0 = const()[name = tensor("pooled_begin_0"), val = tensor([0, 0, 0])]; tensor pooled_end_0 = const()[name = tensor("pooled_end_0"), val = tensor([1, 1, 768])]; tensor pooled_end_mask_0 = const()[name = tensor("pooled_end_mask_0"), val = tensor([true, false, true])]; tensor pooled_squeeze_mask_0 = const()[name = tensor("pooled_squeeze_mask_0"), val = tensor([false, true, false])]; tensor pooled_cast_fp16 = slice_by_index(begin = pooled_begin_0, end = pooled_end_0, end_mask = pooled_end_mask_0, squeeze_mask = pooled_squeeze_mask_0, x = x_59_cast_fp16)[name = tensor("pooled_cast_fp16")]; tensor transpose_0_to_fp16 = const()[name = tensor("transpose_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(174921728)))]; tensor var_1240_bias_0_to_fp16 = const()[name = tensor("op_1240_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(175708224)))]; tensor var_1240_cast_fp16 = linear(bias = var_1240_bias_0_to_fp16, weight = transpose_0_to_fp16, x = pooled_cast_fp16)[name = tensor("op_1240_cast_fp16")]; tensor var_1240_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("op_1240_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor var_1240 = cast(dtype = var_1240_cast_fp16_to_fp32_dtype_0, x = var_1240_cast_fp16)[name = tensor("cast_134")]; } -> (var_1240); }