program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3520.4.1"}, {"coremlc-version", "3520.5.1"}})] { func main(tensor mel) [FlexibleShapeInformation = tuple, dict, tensor>>, tuple, dict, dict, tensor>>>>((("DefaultShapes", {{"mel", [1, 128, 100]}}), ("EnumeratedShapes", {{"mel_1_1_1_128_1000_", {{"mel", [1, 128, 1000]}}}, {"mel_1_1_1_128_100_", {{"mel", [1, 128, 100]}}}, {"mel_1_1_1_128_1500_", {{"mel", [1, 128, 1500]}}}, {"mel_1_1_1_128_2000_", {{"mel", [1, 128, 2000]}}}, {"mel_1_1_1_128_200_", {{"mel", [1, 128, 200]}}}, {"mel_1_1_1_128_3000_", {{"mel", [1, 128, 3000]}}}, {"mel_1_1_1_128_400_", {{"mel", [1, 128, 400]}}}, {"mel_1_1_1_128_600_", {{"mel", [1, 128, 600]}}}, {"mel_1_1_1_128_800_", {{"mel", [1, 128, 800]}}}})))] { tensor input_1_axes_0 = const()[name = tensor("input_1_axes_0"), val = tensor([1])]; tensor mel_to_fp16_dtype_0 = const()[name = tensor("mel_to_fp16_dtype_0"), val = tensor("fp16")]; tensor mel_to_fp16 = cast(dtype = mel_to_fp16_dtype_0, x = mel)[name = tensor("cast_2")]; tensor input_1_cast_fp16 = expand_dims(axes = input_1_axes_0, x = mel_to_fp16)[name = tensor("input_1_cast_fp16")]; tensor var_71_pad_type_0 = const()[name = tensor("op_71_pad_type_0"), val = tensor("custom")]; tensor var_71_pad_0 = const()[name = tensor("op_71_pad_0"), val = tensor([1, 1, 1, 1])]; tensor var_71_strides_0 = const()[name = tensor("op_71_strides_0"), val = tensor([2, 2])]; tensor var_71_dilations_0 = const()[name = tensor("op_71_dilations_0"), val = tensor([1, 1])]; tensor var_71_groups_0 = const()[name = tensor("op_71_groups_0"), val = tensor(1)]; tensor conv2d1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4480))), name = tensor("conv2d1_weight_to_fp16_palettized"), shape = tensor([480, 1, 3, 3])]; tensor conv2d1_bias_to_fp16 = const()[name = tensor("conv2d1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5056)))]; tensor var_71_cast_fp16 = conv(bias = conv2d1_bias_to_fp16, dilations = var_71_dilations_0, groups = var_71_groups_0, pad = var_71_pad_0, pad_type = var_71_pad_type_0, strides = var_71_strides_0, weight = conv2d1_weight_to_fp16_palettized, x = input_1_cast_fp16)[name = tensor("op_71_cast_fp16")]; tensor input_3_mode_0 = const()[name = tensor("input_3_mode_0"), val = tensor("EXACT")]; tensor input_3_cast_fp16 = gelu(mode = input_3_mode_0, x = var_71_cast_fp16)[name = tensor("input_3_cast_fp16")]; tensor var_85_pad_type_0 = const()[name = tensor("op_85_pad_type_0"), val = tensor("custom")]; tensor var_85_pad_0 = const()[name = tensor("op_85_pad_0"), val = tensor([1, 1, 1, 1])]; tensor var_85_strides_0 = const()[name = tensor("op_85_strides_0"), val = tensor([2, 2])]; tensor var_85_dilations_0 = const()[name = tensor("op_85_dilations_0"), val = tensor([1, 1])]; tensor var_85_groups_0 = const()[name = tensor("op_85_groups_0"), val = tensor(1)]; tensor conv2d2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6080))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2079744))), name = tensor("conv2d2_weight_to_fp16_palettized"), shape = tensor([480, 480, 3, 3])]; tensor conv2d2_bias_to_fp16 = const()[name = tensor("conv2d2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2080320)))]; tensor var_85_cast_fp16 = conv(bias = conv2d2_bias_to_fp16, dilations = var_85_dilations_0, groups = var_85_groups_0, pad = var_85_pad_0, pad_type = var_85_pad_type_0, strides = var_85_strides_0, weight = conv2d2_weight_to_fp16_palettized, x = input_3_cast_fp16)[name = tensor("op_85_cast_fp16")]; tensor input_5_mode_0 = const()[name = tensor("input_5_mode_0"), val = tensor("EXACT")]; tensor input_5_cast_fp16 = gelu(mode = input_5_mode_0, x = var_85_cast_fp16)[name = tensor("input_5_cast_fp16")]; tensor var_99_pad_type_0 = const()[name = tensor("op_99_pad_type_0"), val = tensor("custom")]; tensor var_99_pad_0 = const()[name = tensor("op_99_pad_0"), val = tensor([1, 1, 1, 1])]; tensor var_99_strides_0 = const()[name = tensor("op_99_strides_0"), val = tensor([2, 2])]; tensor var_99_dilations_0 = const()[name = tensor("op_99_dilations_0"), val = tensor([1, 1])]; tensor var_99_groups_0 = const()[name = tensor("op_99_groups_0"), val = tensor(1)]; tensor conv2d3_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2081344))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4155008))), name = tensor("conv2d3_weight_to_fp16_palettized"), shape = tensor([480, 480, 3, 3])]; tensor conv2d3_bias_to_fp16 = const()[name = tensor("conv2d3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4155584)))]; tensor var_99_cast_fp16 = conv(bias = conv2d3_bias_to_fp16, dilations = var_99_dilations_0, groups = var_99_groups_0, pad = var_99_pad_0, pad_type = var_99_pad_type_0, strides = var_99_strides_0, weight = conv2d3_weight_to_fp16_palettized, x = input_5_cast_fp16)[name = tensor("op_99_cast_fp16")]; tensor x_1_mode_0 = const()[name = tensor("x_1_mode_0"), val = tensor("EXACT")]; tensor x_1_cast_fp16 = gelu(mode = x_1_mode_0, x = var_99_cast_fp16)[name = tensor("x_1_cast_fp16")]; tensor var_120 = const()[name = tensor("op_120"), val = tensor([0, 3, 1, 2])]; tensor concat_0x = const()[name = tensor("concat_0x"), val = tensor([1, -1, 7680])]; tensor var_121_cast_fp16 = transpose(perm = var_120, x = x_1_cast_fp16)[name = tensor("transpose_240")]; tensor input_7_cast_fp16 = reshape(shape = concat_0x, x = var_121_cast_fp16)[name = tensor("input_7_cast_fp16")]; tensor conv_out_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4156608))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12020992))), name = tensor("conv_out_weight_to_fp16_palettized"), shape = tensor([1024, 7680])]; tensor linear_0_bias_0_to_fp16 = const()[name = tensor("linear_0_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12021568)))]; tensor linear_0_cast_fp16 = linear(bias = linear_0_bias_0_to_fp16, weight = conv_out_weight_to_fp16_palettized, x = input_7_cast_fp16)[name = tensor("linear_0_cast_fp16")]; tensor var_130_shape_cast_fp16 = shape(x = linear_0_cast_fp16)[name = tensor("op_130_shape_cast_fp16")]; tensor gather_4_axis_0 = const()[name = tensor("gather_4_axis_0"), val = tensor(0)]; tensor gather_4_batch_dims_0 = const()[name = tensor("gather_4_batch_dims_0"), val = tensor(0)]; tensor gather_4_validate_indices_0 = const()[name = tensor("gather_4_validate_indices_0"), val = tensor(false)]; tensor var_130_shape_cast_fp16_to_uint16_dtype_0 = const()[name = tensor("op_130_shape_cast_fp16_to_uint16_dtype_0"), val = tensor("uint16")]; tensor select_4_to_uint16 = const()[name = tensor("select_4_to_uint16"), val = tensor(1)]; tensor var_130_shape_cast_fp16_to_uint16 = cast(dtype = var_130_shape_cast_fp16_to_uint16_dtype_0, x = var_130_shape_cast_fp16)[name = tensor("cast_1")]; tensor gather_4_cast_uint16 = gather(axis = gather_4_axis_0, batch_dims = gather_4_batch_dims_0, indices = select_4_to_uint16, validate_indices = gather_4_validate_indices_0, x = var_130_shape_cast_fp16_to_uint16)[name = tensor("gather_4_cast_uint16")]; tensor gather_4_cast_uint16_to_int32_dtype_0 = const()[name = tensor("gather_4_cast_uint16_to_int32_dtype_0"), val = tensor("int32")]; tensor concat_1_values0_0 = const()[name = tensor("concat_1_values0_0"), val = tensor(1)]; tensor concat_1_values2_0 = const()[name = tensor("concat_1_values2_0"), val = tensor(1024)]; tensor concat_1_axis_0 = const()[name = tensor("concat_1_axis_0"), val = tensor(0)]; tensor concat_1_interleave_0 = const()[name = tensor("concat_1_interleave_0"), val = tensor(false)]; tensor gather_4_cast_uint16_to_int32 = cast(dtype = gather_4_cast_uint16_to_int32_dtype_0, x = gather_4_cast_uint16)[name = tensor("cast_0")]; tensor concat_1 = concat(axis = concat_1_axis_0, interleave = concat_1_interleave_0, values = (concat_1_values0_0, gather_4_cast_uint16_to_int32, concat_1_values2_0))[name = tensor("concat_1")]; tensor var_141_begin_0 = const()[name = tensor("op_141_begin_0"), val = tensor([0, 0, 0])]; tensor var_141_end_mask_0 = const()[name = tensor("op_141_end_mask_0"), val = tensor([true, false, true])]; tensor pos_embed_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12023680))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13559744))), name = tensor("pos_embed_to_fp16_palettized"), shape = tensor([1, 1500, 1024])]; tensor var_141_cast_fp16 = slice_by_index(begin = var_141_begin_0, end = concat_1, end_mask = var_141_end_mask_0, x = pos_embed_to_fp16_palettized)[name = tensor("op_141_cast_fp16")]; tensor input_9_cast_fp16 = add(x = linear_0_cast_fp16, y = var_141_cast_fp16)[name = tensor("input_9_cast_fp16")]; tensor var_156 = const()[name = tensor("op_156"), val = tensor(-1)]; tensor x_5_axes_0 = const()[name = tensor("x_5_axes_0"), val = tensor([-1])]; tensor layers_0_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_0_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13560320)))]; tensor layers_0_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_0_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13562432)))]; tensor var_159_to_fp16 = const()[name = tensor("op_159_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_5_cast_fp16 = layer_norm(axes = x_5_axes_0, beta = layers_0_self_attn_layer_norm_bias_to_fp16, epsilon = var_159_to_fp16, gamma = layers_0_self_attn_layer_norm_weight_to_fp16, x = input_9_cast_fp16)[name = tensor("x_5_cast_fp16")]; tensor layers_0_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13564544))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14613184))), name = tensor("layers_0_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_0_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_0_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14613760)))]; tensor linear_1_cast_fp16 = linear(bias = layers_0_self_attn_q_proj_bias_to_fp16, weight = layers_0_self_attn_q_proj_weight_to_fp16_palettized, x = x_5_cast_fp16)[name = tensor("linear_1_cast_fp16")]; tensor concat_2x = const()[name = tensor("concat_2x"), val = tensor([1, -1, 16, 64])]; tensor var_180_cast_fp16 = reshape(shape = concat_2x, x = linear_1_cast_fp16)[name = tensor("op_180_cast_fp16")]; tensor layers_0_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14615872))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15664512))), name = tensor("layers_0_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_0_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_0_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15665088)))]; tensor linear_2_cast_fp16 = linear(bias = layers_0_self_attn_k_proj_bias_to_fp16, weight = layers_0_self_attn_k_proj_weight_to_fp16_palettized, x = x_5_cast_fp16)[name = tensor("linear_2_cast_fp16")]; tensor concat_3x = const()[name = tensor("concat_3x"), val = tensor([1, -1, 16, 64])]; tensor var_186_cast_fp16 = reshape(shape = concat_3x, x = linear_2_cast_fp16)[name = tensor("op_186_cast_fp16")]; tensor layers_0_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15667200))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16715840))), name = tensor("layers_0_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_0_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_0_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16716416)))]; tensor linear_3_cast_fp16 = linear(bias = layers_0_self_attn_v_proj_bias_to_fp16, weight = layers_0_self_attn_v_proj_weight_to_fp16_palettized, x = x_5_cast_fp16)[name = tensor("linear_3_cast_fp16")]; tensor concat_4x = const()[name = tensor("concat_4x"), val = tensor([1, -1, 16, 64])]; tensor var_192_cast_fp16 = reshape(shape = concat_4x, x = linear_3_cast_fp16)[name = tensor("op_192_cast_fp16")]; tensor v_1_perm_0 = const()[name = tensor("v_1_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_195_transpose_x_0 = const()[name = tensor("op_195_transpose_x_0"), val = tensor(false)]; tensor var_195_transpose_y_0 = const()[name = tensor("op_195_transpose_y_0"), val = tensor(false)]; tensor transpose_96_perm_0 = const()[name = tensor("transpose_96_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_97_perm_0 = const()[name = tensor("transpose_97_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_97 = transpose(perm = transpose_97_perm_0, x = var_186_cast_fp16)[name = tensor("transpose_238")]; tensor transpose_96 = transpose(perm = transpose_96_perm_0, x = var_180_cast_fp16)[name = tensor("transpose_239")]; tensor var_195_cast_fp16 = matmul(transpose_x = var_195_transpose_x_0, transpose_y = var_195_transpose_y_0, x = transpose_96, y = transpose_97)[name = tensor("op_195_cast_fp16")]; tensor var_196_to_fp16 = const()[name = tensor("op_196_to_fp16"), val = tensor(0x1p-3)]; tensor input_11_cast_fp16 = mul(x = var_195_cast_fp16, y = var_196_to_fp16)[name = tensor("input_11_cast_fp16")]; tensor attn_1_cast_fp16 = softmax(axis = var_156, x = input_11_cast_fp16)[name = tensor("attn_1_cast_fp16")]; tensor out_1_transpose_x_0 = const()[name = tensor("out_1_transpose_x_0"), val = tensor(false)]; tensor out_1_transpose_y_0 = const()[name = tensor("out_1_transpose_y_0"), val = tensor(false)]; tensor v_1_cast_fp16 = transpose(perm = v_1_perm_0, x = var_192_cast_fp16)[name = tensor("transpose_237")]; tensor out_1_cast_fp16 = matmul(transpose_x = out_1_transpose_x_0, transpose_y = out_1_transpose_y_0, x = attn_1_cast_fp16, y = v_1_cast_fp16)[name = tensor("out_1_cast_fp16")]; tensor var_200_perm_0 = const()[name = tensor("op_200_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_5x = const()[name = tensor("concat_5x"), val = tensor([1, -1, 1024])]; tensor var_200_cast_fp16 = transpose(perm = var_200_perm_0, x = out_1_cast_fp16)[name = tensor("transpose_236")]; tensor input_13_cast_fp16 = reshape(shape = concat_5x, x = var_200_cast_fp16)[name = tensor("input_13_cast_fp16")]; tensor layers_0_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16718528))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17767168))), name = tensor("layers_0_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_0_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_0_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17767744)))]; tensor linear_4_cast_fp16 = linear(bias = layers_0_self_attn_out_proj_bias_to_fp16, weight = layers_0_self_attn_out_proj_weight_to_fp16_palettized, x = input_13_cast_fp16)[name = tensor("linear_4_cast_fp16")]; tensor input_15_cast_fp16 = add(x = input_9_cast_fp16, y = linear_4_cast_fp16)[name = tensor("input_15_cast_fp16")]; tensor input_17_axes_0 = const()[name = tensor("input_17_axes_0"), val = tensor([-1])]; tensor layers_0_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_0_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17769856)))]; tensor layers_0_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_0_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17771968)))]; tensor input_17_cast_fp16 = layer_norm(axes = input_17_axes_0, beta = layers_0_final_layer_norm_bias_to_fp16, epsilon = var_159_to_fp16, gamma = layers_0_final_layer_norm_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("input_17_cast_fp16")]; tensor layers_0_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17774080))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21968448))), name = tensor("layers_0_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_0_fc1_bias_to_fp16 = const()[name = tensor("layers_0_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21969024)))]; tensor linear_5_cast_fp16 = linear(bias = layers_0_fc1_bias_to_fp16, weight = layers_0_fc1_weight_to_fp16_palettized, x = input_17_cast_fp16)[name = tensor("linear_5_cast_fp16")]; tensor input_19_mode_0 = const()[name = tensor("input_19_mode_0"), val = tensor("EXACT")]; tensor input_19_cast_fp16 = gelu(mode = input_19_mode_0, x = linear_5_cast_fp16)[name = tensor("input_19_cast_fp16")]; tensor layers_0_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21977280))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26171648))), name = tensor("layers_0_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_0_fc2_bias_to_fp16 = const()[name = tensor("layers_0_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26172224)))]; tensor linear_6_cast_fp16 = linear(bias = layers_0_fc2_bias_to_fp16, weight = layers_0_fc2_weight_to_fp16_palettized, x = input_19_cast_fp16)[name = tensor("linear_6_cast_fp16")]; tensor input_21_cast_fp16 = add(x = input_15_cast_fp16, y = linear_6_cast_fp16)[name = tensor("input_21_cast_fp16")]; tensor var_226 = const()[name = tensor("op_226"), val = tensor(-1)]; tensor x_11_axes_0 = const()[name = tensor("x_11_axes_0"), val = tensor([-1])]; tensor layers_1_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_1_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26174336)))]; tensor layers_1_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_1_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26176448)))]; tensor var_229_to_fp16 = const()[name = tensor("op_229_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_11_cast_fp16 = layer_norm(axes = x_11_axes_0, beta = layers_1_self_attn_layer_norm_bias_to_fp16, epsilon = var_229_to_fp16, gamma = layers_1_self_attn_layer_norm_weight_to_fp16, x = input_21_cast_fp16)[name = tensor("x_11_cast_fp16")]; tensor layers_1_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26178560))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27227200))), name = tensor("layers_1_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_1_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_1_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27227776)))]; tensor linear_7_cast_fp16 = linear(bias = layers_1_self_attn_q_proj_bias_to_fp16, weight = layers_1_self_attn_q_proj_weight_to_fp16_palettized, x = x_11_cast_fp16)[name = tensor("linear_7_cast_fp16")]; tensor concat_6x = const()[name = tensor("concat_6x"), val = tensor([1, -1, 16, 64])]; tensor var_250_cast_fp16 = reshape(shape = concat_6x, x = linear_7_cast_fp16)[name = tensor("op_250_cast_fp16")]; tensor layers_1_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27229888))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28278528))), name = tensor("layers_1_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_1_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_1_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28279104)))]; tensor linear_8_cast_fp16 = linear(bias = layers_1_self_attn_k_proj_bias_to_fp16, weight = layers_1_self_attn_k_proj_weight_to_fp16_palettized, x = x_11_cast_fp16)[name = tensor("linear_8_cast_fp16")]; tensor concat_7x = const()[name = tensor("concat_7x"), val = tensor([1, -1, 16, 64])]; tensor var_256_cast_fp16 = reshape(shape = concat_7x, x = linear_8_cast_fp16)[name = tensor("op_256_cast_fp16")]; tensor layers_1_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28281216))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29329856))), name = tensor("layers_1_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_1_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_1_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29330432)))]; tensor linear_9_cast_fp16 = linear(bias = layers_1_self_attn_v_proj_bias_to_fp16, weight = layers_1_self_attn_v_proj_weight_to_fp16_palettized, x = x_11_cast_fp16)[name = tensor("linear_9_cast_fp16")]; tensor concat_8x = const()[name = tensor("concat_8x"), val = tensor([1, -1, 16, 64])]; tensor var_262_cast_fp16 = reshape(shape = concat_8x, x = linear_9_cast_fp16)[name = tensor("op_262_cast_fp16")]; tensor v_3_perm_0 = const()[name = tensor("v_3_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_265_transpose_x_0 = const()[name = tensor("op_265_transpose_x_0"), val = tensor(false)]; tensor var_265_transpose_y_0 = const()[name = tensor("op_265_transpose_y_0"), val = tensor(false)]; tensor transpose_98_perm_0 = const()[name = tensor("transpose_98_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_99_perm_0 = const()[name = tensor("transpose_99_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_99 = transpose(perm = transpose_99_perm_0, x = var_256_cast_fp16)[name = tensor("transpose_234")]; tensor transpose_98 = transpose(perm = transpose_98_perm_0, x = var_250_cast_fp16)[name = tensor("transpose_235")]; tensor var_265_cast_fp16 = matmul(transpose_x = var_265_transpose_x_0, transpose_y = var_265_transpose_y_0, x = transpose_98, y = transpose_99)[name = tensor("op_265_cast_fp16")]; tensor var_266_to_fp16 = const()[name = tensor("op_266_to_fp16"), val = tensor(0x1p-3)]; tensor input_23_cast_fp16 = mul(x = var_265_cast_fp16, y = var_266_to_fp16)[name = tensor("input_23_cast_fp16")]; tensor attn_3_cast_fp16 = softmax(axis = var_226, x = input_23_cast_fp16)[name = tensor("attn_3_cast_fp16")]; tensor out_3_transpose_x_0 = const()[name = tensor("out_3_transpose_x_0"), val = tensor(false)]; tensor out_3_transpose_y_0 = const()[name = tensor("out_3_transpose_y_0"), val = tensor(false)]; tensor v_3_cast_fp16 = transpose(perm = v_3_perm_0, x = var_262_cast_fp16)[name = tensor("transpose_233")]; tensor out_3_cast_fp16 = matmul(transpose_x = out_3_transpose_x_0, transpose_y = out_3_transpose_y_0, x = attn_3_cast_fp16, y = v_3_cast_fp16)[name = tensor("out_3_cast_fp16")]; tensor var_270_perm_0 = const()[name = tensor("op_270_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_9x = const()[name = tensor("concat_9x"), val = tensor([1, -1, 1024])]; tensor var_270_cast_fp16 = transpose(perm = var_270_perm_0, x = out_3_cast_fp16)[name = tensor("transpose_232")]; tensor input_25_cast_fp16 = reshape(shape = concat_9x, x = var_270_cast_fp16)[name = tensor("input_25_cast_fp16")]; tensor layers_1_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29332544))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30381184))), name = tensor("layers_1_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_1_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_1_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30381760)))]; tensor linear_10_cast_fp16 = linear(bias = layers_1_self_attn_out_proj_bias_to_fp16, weight = layers_1_self_attn_out_proj_weight_to_fp16_palettized, x = input_25_cast_fp16)[name = tensor("linear_10_cast_fp16")]; tensor input_27_cast_fp16 = add(x = input_21_cast_fp16, y = linear_10_cast_fp16)[name = tensor("input_27_cast_fp16")]; tensor input_29_axes_0 = const()[name = tensor("input_29_axes_0"), val = tensor([-1])]; tensor layers_1_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_1_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30383872)))]; tensor layers_1_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_1_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30385984)))]; tensor input_29_cast_fp16 = layer_norm(axes = input_29_axes_0, beta = layers_1_final_layer_norm_bias_to_fp16, epsilon = var_229_to_fp16, gamma = layers_1_final_layer_norm_weight_to_fp16, x = input_27_cast_fp16)[name = tensor("input_29_cast_fp16")]; tensor layers_1_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30388096))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34582464))), name = tensor("layers_1_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_1_fc1_bias_to_fp16 = const()[name = tensor("layers_1_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34583040)))]; tensor linear_11_cast_fp16 = linear(bias = layers_1_fc1_bias_to_fp16, weight = layers_1_fc1_weight_to_fp16_palettized, x = input_29_cast_fp16)[name = tensor("linear_11_cast_fp16")]; tensor input_31_mode_0 = const()[name = tensor("input_31_mode_0"), val = tensor("EXACT")]; tensor input_31_cast_fp16 = gelu(mode = input_31_mode_0, x = linear_11_cast_fp16)[name = tensor("input_31_cast_fp16")]; tensor layers_1_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34591296))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38785664))), name = tensor("layers_1_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_1_fc2_bias_to_fp16 = const()[name = tensor("layers_1_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38786240)))]; tensor linear_12_cast_fp16 = linear(bias = layers_1_fc2_bias_to_fp16, weight = layers_1_fc2_weight_to_fp16_palettized, x = input_31_cast_fp16)[name = tensor("linear_12_cast_fp16")]; tensor input_33_cast_fp16 = add(x = input_27_cast_fp16, y = linear_12_cast_fp16)[name = tensor("input_33_cast_fp16")]; tensor var_296 = const()[name = tensor("op_296"), val = tensor(-1)]; tensor x_17_axes_0 = const()[name = tensor("x_17_axes_0"), val = tensor([-1])]; tensor layers_2_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_2_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38788352)))]; tensor layers_2_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_2_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38790464)))]; tensor var_299_to_fp16 = const()[name = tensor("op_299_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_17_cast_fp16 = layer_norm(axes = x_17_axes_0, beta = layers_2_self_attn_layer_norm_bias_to_fp16, epsilon = var_299_to_fp16, gamma = layers_2_self_attn_layer_norm_weight_to_fp16, x = input_33_cast_fp16)[name = tensor("x_17_cast_fp16")]; tensor layers_2_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38792576))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39841216))), name = tensor("layers_2_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_2_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_2_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39841792)))]; tensor linear_13_cast_fp16 = linear(bias = layers_2_self_attn_q_proj_bias_to_fp16, weight = layers_2_self_attn_q_proj_weight_to_fp16_palettized, x = x_17_cast_fp16)[name = tensor("linear_13_cast_fp16")]; tensor concat_10x = const()[name = tensor("concat_10x"), val = tensor([1, -1, 16, 64])]; tensor var_320_cast_fp16 = reshape(shape = concat_10x, x = linear_13_cast_fp16)[name = tensor("op_320_cast_fp16")]; tensor layers_2_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39843904))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40892544))), name = tensor("layers_2_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_2_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_2_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40893120)))]; tensor linear_14_cast_fp16 = linear(bias = layers_2_self_attn_k_proj_bias_to_fp16, weight = layers_2_self_attn_k_proj_weight_to_fp16_palettized, x = x_17_cast_fp16)[name = tensor("linear_14_cast_fp16")]; tensor concat_11x = const()[name = tensor("concat_11x"), val = tensor([1, -1, 16, 64])]; tensor var_326_cast_fp16 = reshape(shape = concat_11x, x = linear_14_cast_fp16)[name = tensor("op_326_cast_fp16")]; tensor layers_2_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40895232))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41943872))), name = tensor("layers_2_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_2_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_2_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41944448)))]; tensor linear_15_cast_fp16 = linear(bias = layers_2_self_attn_v_proj_bias_to_fp16, weight = layers_2_self_attn_v_proj_weight_to_fp16_palettized, x = x_17_cast_fp16)[name = tensor("linear_15_cast_fp16")]; tensor concat_12x = const()[name = tensor("concat_12x"), val = tensor([1, -1, 16, 64])]; tensor var_332_cast_fp16 = reshape(shape = concat_12x, x = linear_15_cast_fp16)[name = tensor("op_332_cast_fp16")]; tensor v_5_perm_0 = const()[name = tensor("v_5_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_335_transpose_x_0 = const()[name = tensor("op_335_transpose_x_0"), val = tensor(false)]; tensor var_335_transpose_y_0 = const()[name = tensor("op_335_transpose_y_0"), val = tensor(false)]; tensor transpose_100_perm_0 = const()[name = tensor("transpose_100_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_101_perm_0 = const()[name = tensor("transpose_101_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_101 = transpose(perm = transpose_101_perm_0, x = var_326_cast_fp16)[name = tensor("transpose_230")]; tensor transpose_100 = transpose(perm = transpose_100_perm_0, x = var_320_cast_fp16)[name = tensor("transpose_231")]; tensor var_335_cast_fp16 = matmul(transpose_x = var_335_transpose_x_0, transpose_y = var_335_transpose_y_0, x = transpose_100, y = transpose_101)[name = tensor("op_335_cast_fp16")]; tensor var_336_to_fp16 = const()[name = tensor("op_336_to_fp16"), val = tensor(0x1p-3)]; tensor input_35_cast_fp16 = mul(x = var_335_cast_fp16, y = var_336_to_fp16)[name = tensor("input_35_cast_fp16")]; tensor attn_5_cast_fp16 = softmax(axis = var_296, x = input_35_cast_fp16)[name = tensor("attn_5_cast_fp16")]; tensor out_5_transpose_x_0 = const()[name = tensor("out_5_transpose_x_0"), val = tensor(false)]; tensor out_5_transpose_y_0 = const()[name = tensor("out_5_transpose_y_0"), val = tensor(false)]; tensor v_5_cast_fp16 = transpose(perm = v_5_perm_0, x = var_332_cast_fp16)[name = tensor("transpose_229")]; tensor out_5_cast_fp16 = matmul(transpose_x = out_5_transpose_x_0, transpose_y = out_5_transpose_y_0, x = attn_5_cast_fp16, y = v_5_cast_fp16)[name = tensor("out_5_cast_fp16")]; tensor var_340_perm_0 = const()[name = tensor("op_340_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_13x = const()[name = tensor("concat_13x"), val = tensor([1, -1, 1024])]; tensor var_340_cast_fp16 = transpose(perm = var_340_perm_0, x = out_5_cast_fp16)[name = tensor("transpose_228")]; tensor input_37_cast_fp16 = reshape(shape = concat_13x, x = var_340_cast_fp16)[name = tensor("input_37_cast_fp16")]; tensor layers_2_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41946560))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(42995200))), name = tensor("layers_2_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_2_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_2_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(42995776)))]; tensor linear_16_cast_fp16 = linear(bias = layers_2_self_attn_out_proj_bias_to_fp16, weight = layers_2_self_attn_out_proj_weight_to_fp16_palettized, x = input_37_cast_fp16)[name = tensor("linear_16_cast_fp16")]; tensor input_39_cast_fp16 = add(x = input_33_cast_fp16, y = linear_16_cast_fp16)[name = tensor("input_39_cast_fp16")]; tensor input_41_axes_0 = const()[name = tensor("input_41_axes_0"), val = tensor([-1])]; tensor layers_2_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_2_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(42997888)))]; tensor layers_2_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_2_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43000000)))]; tensor input_41_cast_fp16 = layer_norm(axes = input_41_axes_0, beta = layers_2_final_layer_norm_bias_to_fp16, epsilon = var_299_to_fp16, gamma = layers_2_final_layer_norm_weight_to_fp16, x = input_39_cast_fp16)[name = tensor("input_41_cast_fp16")]; tensor layers_2_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43002112))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47196480))), name = tensor("layers_2_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_2_fc1_bias_to_fp16 = const()[name = tensor("layers_2_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47197056)))]; tensor linear_17_cast_fp16 = linear(bias = layers_2_fc1_bias_to_fp16, weight = layers_2_fc1_weight_to_fp16_palettized, x = input_41_cast_fp16)[name = tensor("linear_17_cast_fp16")]; tensor input_43_mode_0 = const()[name = tensor("input_43_mode_0"), val = tensor("EXACT")]; tensor input_43_cast_fp16 = gelu(mode = input_43_mode_0, x = linear_17_cast_fp16)[name = tensor("input_43_cast_fp16")]; tensor layers_2_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47205312))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(51399680))), name = tensor("layers_2_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_2_fc2_bias_to_fp16 = const()[name = tensor("layers_2_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(51400256)))]; tensor linear_18_cast_fp16 = linear(bias = layers_2_fc2_bias_to_fp16, weight = layers_2_fc2_weight_to_fp16_palettized, x = input_43_cast_fp16)[name = tensor("linear_18_cast_fp16")]; tensor input_45_cast_fp16 = add(x = input_39_cast_fp16, y = linear_18_cast_fp16)[name = tensor("input_45_cast_fp16")]; tensor var_366 = const()[name = tensor("op_366"), val = tensor(-1)]; tensor x_23_axes_0 = const()[name = tensor("x_23_axes_0"), val = tensor([-1])]; tensor layers_3_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_3_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(51402368)))]; tensor layers_3_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_3_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(51404480)))]; tensor var_369_to_fp16 = const()[name = tensor("op_369_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_23_cast_fp16 = layer_norm(axes = x_23_axes_0, beta = layers_3_self_attn_layer_norm_bias_to_fp16, epsilon = var_369_to_fp16, gamma = layers_3_self_attn_layer_norm_weight_to_fp16, x = input_45_cast_fp16)[name = tensor("x_23_cast_fp16")]; tensor layers_3_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(51406592))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(52455232))), name = tensor("layers_3_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_3_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_3_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(52455808)))]; tensor linear_19_cast_fp16 = linear(bias = layers_3_self_attn_q_proj_bias_to_fp16, weight = layers_3_self_attn_q_proj_weight_to_fp16_palettized, x = x_23_cast_fp16)[name = tensor("linear_19_cast_fp16")]; tensor concat_14x = const()[name = tensor("concat_14x"), val = tensor([1, -1, 16, 64])]; tensor var_390_cast_fp16 = reshape(shape = concat_14x, x = linear_19_cast_fp16)[name = tensor("op_390_cast_fp16")]; tensor layers_3_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(52457920))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53506560))), name = tensor("layers_3_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_3_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_3_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53507136)))]; tensor linear_20_cast_fp16 = linear(bias = layers_3_self_attn_k_proj_bias_to_fp16, weight = layers_3_self_attn_k_proj_weight_to_fp16_palettized, x = x_23_cast_fp16)[name = tensor("linear_20_cast_fp16")]; tensor concat_15x = const()[name = tensor("concat_15x"), val = tensor([1, -1, 16, 64])]; tensor var_396_cast_fp16 = reshape(shape = concat_15x, x = linear_20_cast_fp16)[name = tensor("op_396_cast_fp16")]; tensor layers_3_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53509248))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(54557888))), name = tensor("layers_3_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_3_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_3_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(54558464)))]; tensor linear_21_cast_fp16 = linear(bias = layers_3_self_attn_v_proj_bias_to_fp16, weight = layers_3_self_attn_v_proj_weight_to_fp16_palettized, x = x_23_cast_fp16)[name = tensor("linear_21_cast_fp16")]; tensor concat_16x = const()[name = tensor("concat_16x"), val = tensor([1, -1, 16, 64])]; tensor var_402_cast_fp16 = reshape(shape = concat_16x, x = linear_21_cast_fp16)[name = tensor("op_402_cast_fp16")]; tensor v_7_perm_0 = const()[name = tensor("v_7_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_405_transpose_x_0 = const()[name = tensor("op_405_transpose_x_0"), val = tensor(false)]; tensor var_405_transpose_y_0 = const()[name = tensor("op_405_transpose_y_0"), val = tensor(false)]; tensor transpose_102_perm_0 = const()[name = tensor("transpose_102_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_103_perm_0 = const()[name = tensor("transpose_103_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_103 = transpose(perm = transpose_103_perm_0, x = var_396_cast_fp16)[name = tensor("transpose_226")]; tensor transpose_102 = transpose(perm = transpose_102_perm_0, x = var_390_cast_fp16)[name = tensor("transpose_227")]; tensor var_405_cast_fp16 = matmul(transpose_x = var_405_transpose_x_0, transpose_y = var_405_transpose_y_0, x = transpose_102, y = transpose_103)[name = tensor("op_405_cast_fp16")]; tensor var_406_to_fp16 = const()[name = tensor("op_406_to_fp16"), val = tensor(0x1p-3)]; tensor input_47_cast_fp16 = mul(x = var_405_cast_fp16, y = var_406_to_fp16)[name = tensor("input_47_cast_fp16")]; tensor attn_7_cast_fp16 = softmax(axis = var_366, x = input_47_cast_fp16)[name = tensor("attn_7_cast_fp16")]; tensor out_7_transpose_x_0 = const()[name = tensor("out_7_transpose_x_0"), val = tensor(false)]; tensor out_7_transpose_y_0 = const()[name = tensor("out_7_transpose_y_0"), val = tensor(false)]; tensor v_7_cast_fp16 = transpose(perm = v_7_perm_0, x = var_402_cast_fp16)[name = tensor("transpose_225")]; tensor out_7_cast_fp16 = matmul(transpose_x = out_7_transpose_x_0, transpose_y = out_7_transpose_y_0, x = attn_7_cast_fp16, y = v_7_cast_fp16)[name = tensor("out_7_cast_fp16")]; tensor var_410_perm_0 = const()[name = tensor("op_410_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_17x = const()[name = tensor("concat_17x"), val = tensor([1, -1, 1024])]; tensor var_410_cast_fp16 = transpose(perm = var_410_perm_0, x = out_7_cast_fp16)[name = tensor("transpose_224")]; tensor input_49_cast_fp16 = reshape(shape = concat_17x, x = var_410_cast_fp16)[name = tensor("input_49_cast_fp16")]; tensor layers_3_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(54560576))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(55609216))), name = tensor("layers_3_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_3_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_3_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(55609792)))]; tensor linear_22_cast_fp16 = linear(bias = layers_3_self_attn_out_proj_bias_to_fp16, weight = layers_3_self_attn_out_proj_weight_to_fp16_palettized, x = input_49_cast_fp16)[name = tensor("linear_22_cast_fp16")]; tensor input_51_cast_fp16 = add(x = input_45_cast_fp16, y = linear_22_cast_fp16)[name = tensor("input_51_cast_fp16")]; tensor input_53_axes_0 = const()[name = tensor("input_53_axes_0"), val = tensor([-1])]; tensor layers_3_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_3_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(55611904)))]; tensor layers_3_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_3_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(55614016)))]; tensor input_53_cast_fp16 = layer_norm(axes = input_53_axes_0, beta = layers_3_final_layer_norm_bias_to_fp16, epsilon = var_369_to_fp16, gamma = layers_3_final_layer_norm_weight_to_fp16, x = input_51_cast_fp16)[name = tensor("input_53_cast_fp16")]; tensor layers_3_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(55616128))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(59810496))), name = tensor("layers_3_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_3_fc1_bias_to_fp16 = const()[name = tensor("layers_3_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(59811072)))]; tensor linear_23_cast_fp16 = linear(bias = layers_3_fc1_bias_to_fp16, weight = layers_3_fc1_weight_to_fp16_palettized, x = input_53_cast_fp16)[name = tensor("linear_23_cast_fp16")]; tensor input_55_mode_0 = const()[name = tensor("input_55_mode_0"), val = tensor("EXACT")]; tensor input_55_cast_fp16 = gelu(mode = input_55_mode_0, x = linear_23_cast_fp16)[name = tensor("input_55_cast_fp16")]; tensor layers_3_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(59819328))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64013696))), name = tensor("layers_3_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_3_fc2_bias_to_fp16 = const()[name = tensor("layers_3_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64014272)))]; tensor linear_24_cast_fp16 = linear(bias = layers_3_fc2_bias_to_fp16, weight = layers_3_fc2_weight_to_fp16_palettized, x = input_55_cast_fp16)[name = tensor("linear_24_cast_fp16")]; tensor input_57_cast_fp16 = add(x = input_51_cast_fp16, y = linear_24_cast_fp16)[name = tensor("input_57_cast_fp16")]; tensor var_436 = const()[name = tensor("op_436"), val = tensor(-1)]; tensor x_29_axes_0 = const()[name = tensor("x_29_axes_0"), val = tensor([-1])]; tensor layers_4_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_4_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64016384)))]; tensor layers_4_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_4_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64018496)))]; tensor var_439_to_fp16 = const()[name = tensor("op_439_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_29_cast_fp16 = layer_norm(axes = x_29_axes_0, beta = layers_4_self_attn_layer_norm_bias_to_fp16, epsilon = var_439_to_fp16, gamma = layers_4_self_attn_layer_norm_weight_to_fp16, x = input_57_cast_fp16)[name = tensor("x_29_cast_fp16")]; tensor layers_4_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64020608))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65069248))), name = tensor("layers_4_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_4_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_4_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65069824)))]; tensor linear_25_cast_fp16 = linear(bias = layers_4_self_attn_q_proj_bias_to_fp16, weight = layers_4_self_attn_q_proj_weight_to_fp16_palettized, x = x_29_cast_fp16)[name = tensor("linear_25_cast_fp16")]; tensor concat_18x = const()[name = tensor("concat_18x"), val = tensor([1, -1, 16, 64])]; tensor var_460_cast_fp16 = reshape(shape = concat_18x, x = linear_25_cast_fp16)[name = tensor("op_460_cast_fp16")]; tensor layers_4_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65071936))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(66120576))), name = tensor("layers_4_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_4_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_4_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(66121152)))]; tensor linear_26_cast_fp16 = linear(bias = layers_4_self_attn_k_proj_bias_to_fp16, weight = layers_4_self_attn_k_proj_weight_to_fp16_palettized, x = x_29_cast_fp16)[name = tensor("linear_26_cast_fp16")]; tensor concat_19x = const()[name = tensor("concat_19x"), val = tensor([1, -1, 16, 64])]; tensor var_466_cast_fp16 = reshape(shape = concat_19x, x = linear_26_cast_fp16)[name = tensor("op_466_cast_fp16")]; tensor layers_4_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(66123264))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67171904))), name = tensor("layers_4_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_4_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_4_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67172480)))]; tensor linear_27_cast_fp16 = linear(bias = layers_4_self_attn_v_proj_bias_to_fp16, weight = layers_4_self_attn_v_proj_weight_to_fp16_palettized, x = x_29_cast_fp16)[name = tensor("linear_27_cast_fp16")]; tensor concat_20x = const()[name = tensor("concat_20x"), val = tensor([1, -1, 16, 64])]; tensor var_472_cast_fp16 = reshape(shape = concat_20x, x = linear_27_cast_fp16)[name = tensor("op_472_cast_fp16")]; tensor v_9_perm_0 = const()[name = tensor("v_9_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_475_transpose_x_0 = const()[name = tensor("op_475_transpose_x_0"), val = tensor(false)]; tensor var_475_transpose_y_0 = const()[name = tensor("op_475_transpose_y_0"), val = tensor(false)]; tensor transpose_104_perm_0 = const()[name = tensor("transpose_104_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_105_perm_0 = const()[name = tensor("transpose_105_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_105 = transpose(perm = transpose_105_perm_0, x = var_466_cast_fp16)[name = tensor("transpose_222")]; tensor transpose_104 = transpose(perm = transpose_104_perm_0, x = var_460_cast_fp16)[name = tensor("transpose_223")]; tensor var_475_cast_fp16 = matmul(transpose_x = var_475_transpose_x_0, transpose_y = var_475_transpose_y_0, x = transpose_104, y = transpose_105)[name = tensor("op_475_cast_fp16")]; tensor var_476_to_fp16 = const()[name = tensor("op_476_to_fp16"), val = tensor(0x1p-3)]; tensor input_59_cast_fp16 = mul(x = var_475_cast_fp16, y = var_476_to_fp16)[name = tensor("input_59_cast_fp16")]; tensor attn_9_cast_fp16 = softmax(axis = var_436, x = input_59_cast_fp16)[name = tensor("attn_9_cast_fp16")]; tensor out_9_transpose_x_0 = const()[name = tensor("out_9_transpose_x_0"), val = tensor(false)]; tensor out_9_transpose_y_0 = const()[name = tensor("out_9_transpose_y_0"), val = tensor(false)]; tensor v_9_cast_fp16 = transpose(perm = v_9_perm_0, x = var_472_cast_fp16)[name = tensor("transpose_221")]; tensor out_9_cast_fp16 = matmul(transpose_x = out_9_transpose_x_0, transpose_y = out_9_transpose_y_0, x = attn_9_cast_fp16, y = v_9_cast_fp16)[name = tensor("out_9_cast_fp16")]; tensor var_480_perm_0 = const()[name = tensor("op_480_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_21x = const()[name = tensor("concat_21x"), val = tensor([1, -1, 1024])]; tensor var_480_cast_fp16 = transpose(perm = var_480_perm_0, x = out_9_cast_fp16)[name = tensor("transpose_220")]; tensor input_61_cast_fp16 = reshape(shape = concat_21x, x = var_480_cast_fp16)[name = tensor("input_61_cast_fp16")]; tensor layers_4_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67174592))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68223232))), name = tensor("layers_4_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_4_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_4_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68223808)))]; tensor linear_28_cast_fp16 = linear(bias = layers_4_self_attn_out_proj_bias_to_fp16, weight = layers_4_self_attn_out_proj_weight_to_fp16_palettized, x = input_61_cast_fp16)[name = tensor("linear_28_cast_fp16")]; tensor input_63_cast_fp16 = add(x = input_57_cast_fp16, y = linear_28_cast_fp16)[name = tensor("input_63_cast_fp16")]; tensor input_65_axes_0 = const()[name = tensor("input_65_axes_0"), val = tensor([-1])]; tensor layers_4_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_4_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68225920)))]; tensor layers_4_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_4_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68228032)))]; tensor input_65_cast_fp16 = layer_norm(axes = input_65_axes_0, beta = layers_4_final_layer_norm_bias_to_fp16, epsilon = var_439_to_fp16, gamma = layers_4_final_layer_norm_weight_to_fp16, x = input_63_cast_fp16)[name = tensor("input_65_cast_fp16")]; tensor layers_4_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68230144))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(72424512))), name = tensor("layers_4_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_4_fc1_bias_to_fp16 = const()[name = tensor("layers_4_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(72425088)))]; tensor linear_29_cast_fp16 = linear(bias = layers_4_fc1_bias_to_fp16, weight = layers_4_fc1_weight_to_fp16_palettized, x = input_65_cast_fp16)[name = tensor("linear_29_cast_fp16")]; tensor input_67_mode_0 = const()[name = tensor("input_67_mode_0"), val = tensor("EXACT")]; tensor input_67_cast_fp16 = gelu(mode = input_67_mode_0, x = linear_29_cast_fp16)[name = tensor("input_67_cast_fp16")]; tensor layers_4_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(72433344))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(76627712))), name = tensor("layers_4_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_4_fc2_bias_to_fp16 = const()[name = tensor("layers_4_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(76628288)))]; tensor linear_30_cast_fp16 = linear(bias = layers_4_fc2_bias_to_fp16, weight = layers_4_fc2_weight_to_fp16_palettized, x = input_67_cast_fp16)[name = tensor("linear_30_cast_fp16")]; tensor input_69_cast_fp16 = add(x = input_63_cast_fp16, y = linear_30_cast_fp16)[name = tensor("input_69_cast_fp16")]; tensor var_506 = const()[name = tensor("op_506"), val = tensor(-1)]; tensor x_35_axes_0 = const()[name = tensor("x_35_axes_0"), val = tensor([-1])]; tensor layers_5_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_5_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(76630400)))]; tensor layers_5_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_5_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(76632512)))]; tensor var_509_to_fp16 = const()[name = tensor("op_509_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_35_cast_fp16 = layer_norm(axes = x_35_axes_0, beta = layers_5_self_attn_layer_norm_bias_to_fp16, epsilon = var_509_to_fp16, gamma = layers_5_self_attn_layer_norm_weight_to_fp16, x = input_69_cast_fp16)[name = tensor("x_35_cast_fp16")]; tensor layers_5_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(76634624))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(77683264))), name = tensor("layers_5_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_5_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_5_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(77683840)))]; tensor linear_31_cast_fp16 = linear(bias = layers_5_self_attn_q_proj_bias_to_fp16, weight = layers_5_self_attn_q_proj_weight_to_fp16_palettized, x = x_35_cast_fp16)[name = tensor("linear_31_cast_fp16")]; tensor concat_22x = const()[name = tensor("concat_22x"), val = tensor([1, -1, 16, 64])]; tensor var_530_cast_fp16 = reshape(shape = concat_22x, x = linear_31_cast_fp16)[name = tensor("op_530_cast_fp16")]; tensor layers_5_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(77685952))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78734592))), name = tensor("layers_5_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_5_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_5_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78735168)))]; tensor linear_32_cast_fp16 = linear(bias = layers_5_self_attn_k_proj_bias_to_fp16, weight = layers_5_self_attn_k_proj_weight_to_fp16_palettized, x = x_35_cast_fp16)[name = tensor("linear_32_cast_fp16")]; tensor concat_23x = const()[name = tensor("concat_23x"), val = tensor([1, -1, 16, 64])]; tensor var_536_cast_fp16 = reshape(shape = concat_23x, x = linear_32_cast_fp16)[name = tensor("op_536_cast_fp16")]; tensor layers_5_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78737280))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(79785920))), name = tensor("layers_5_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_5_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_5_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(79786496)))]; tensor linear_33_cast_fp16 = linear(bias = layers_5_self_attn_v_proj_bias_to_fp16, weight = layers_5_self_attn_v_proj_weight_to_fp16_palettized, x = x_35_cast_fp16)[name = tensor("linear_33_cast_fp16")]; tensor concat_24x = const()[name = tensor("concat_24x"), val = tensor([1, -1, 16, 64])]; tensor var_542_cast_fp16 = reshape(shape = concat_24x, x = linear_33_cast_fp16)[name = tensor("op_542_cast_fp16")]; tensor v_11_perm_0 = const()[name = tensor("v_11_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_545_transpose_x_0 = const()[name = tensor("op_545_transpose_x_0"), val = tensor(false)]; tensor var_545_transpose_y_0 = const()[name = tensor("op_545_transpose_y_0"), val = tensor(false)]; tensor transpose_106_perm_0 = const()[name = tensor("transpose_106_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_107_perm_0 = const()[name = tensor("transpose_107_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_107 = transpose(perm = transpose_107_perm_0, x = var_536_cast_fp16)[name = tensor("transpose_218")]; tensor transpose_106 = transpose(perm = transpose_106_perm_0, x = var_530_cast_fp16)[name = tensor("transpose_219")]; tensor var_545_cast_fp16 = matmul(transpose_x = var_545_transpose_x_0, transpose_y = var_545_transpose_y_0, x = transpose_106, y = transpose_107)[name = tensor("op_545_cast_fp16")]; tensor var_546_to_fp16 = const()[name = tensor("op_546_to_fp16"), val = tensor(0x1p-3)]; tensor input_71_cast_fp16 = mul(x = var_545_cast_fp16, y = var_546_to_fp16)[name = tensor("input_71_cast_fp16")]; tensor attn_11_cast_fp16 = softmax(axis = var_506, x = input_71_cast_fp16)[name = tensor("attn_11_cast_fp16")]; tensor out_11_transpose_x_0 = const()[name = tensor("out_11_transpose_x_0"), val = tensor(false)]; tensor out_11_transpose_y_0 = const()[name = tensor("out_11_transpose_y_0"), val = tensor(false)]; tensor v_11_cast_fp16 = transpose(perm = v_11_perm_0, x = var_542_cast_fp16)[name = tensor("transpose_217")]; tensor out_11_cast_fp16 = matmul(transpose_x = out_11_transpose_x_0, transpose_y = out_11_transpose_y_0, x = attn_11_cast_fp16, y = v_11_cast_fp16)[name = tensor("out_11_cast_fp16")]; tensor var_550_perm_0 = const()[name = tensor("op_550_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_25x = const()[name = tensor("concat_25x"), val = tensor([1, -1, 1024])]; tensor var_550_cast_fp16 = transpose(perm = var_550_perm_0, x = out_11_cast_fp16)[name = tensor("transpose_216")]; tensor input_73_cast_fp16 = reshape(shape = concat_25x, x = var_550_cast_fp16)[name = tensor("input_73_cast_fp16")]; tensor layers_5_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(79788608))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80837248))), name = tensor("layers_5_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_5_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_5_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80837824)))]; tensor linear_34_cast_fp16 = linear(bias = layers_5_self_attn_out_proj_bias_to_fp16, weight = layers_5_self_attn_out_proj_weight_to_fp16_palettized, x = input_73_cast_fp16)[name = tensor("linear_34_cast_fp16")]; tensor input_75_cast_fp16 = add(x = input_69_cast_fp16, y = linear_34_cast_fp16)[name = tensor("input_75_cast_fp16")]; tensor input_77_axes_0 = const()[name = tensor("input_77_axes_0"), val = tensor([-1])]; tensor layers_5_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_5_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80839936)))]; tensor layers_5_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_5_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80842048)))]; tensor input_77_cast_fp16 = layer_norm(axes = input_77_axes_0, beta = layers_5_final_layer_norm_bias_to_fp16, epsilon = var_509_to_fp16, gamma = layers_5_final_layer_norm_weight_to_fp16, x = input_75_cast_fp16)[name = tensor("input_77_cast_fp16")]; tensor layers_5_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80844160))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85038528))), name = tensor("layers_5_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_5_fc1_bias_to_fp16 = const()[name = tensor("layers_5_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85039104)))]; tensor linear_35_cast_fp16 = linear(bias = layers_5_fc1_bias_to_fp16, weight = layers_5_fc1_weight_to_fp16_palettized, x = input_77_cast_fp16)[name = tensor("linear_35_cast_fp16")]; tensor input_79_mode_0 = const()[name = tensor("input_79_mode_0"), val = tensor("EXACT")]; tensor input_79_cast_fp16 = gelu(mode = input_79_mode_0, x = linear_35_cast_fp16)[name = tensor("input_79_cast_fp16")]; tensor layers_5_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85047360))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89241728))), name = tensor("layers_5_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_5_fc2_bias_to_fp16 = const()[name = tensor("layers_5_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89242304)))]; tensor linear_36_cast_fp16 = linear(bias = layers_5_fc2_bias_to_fp16, weight = layers_5_fc2_weight_to_fp16_palettized, x = input_79_cast_fp16)[name = tensor("linear_36_cast_fp16")]; tensor input_81_cast_fp16 = add(x = input_75_cast_fp16, y = linear_36_cast_fp16)[name = tensor("input_81_cast_fp16")]; tensor var_576 = const()[name = tensor("op_576"), val = tensor(-1)]; tensor x_41_axes_0 = const()[name = tensor("x_41_axes_0"), val = tensor([-1])]; tensor layers_6_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_6_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89244416)))]; tensor layers_6_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_6_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89246528)))]; tensor var_579_to_fp16 = const()[name = tensor("op_579_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_41_cast_fp16 = layer_norm(axes = x_41_axes_0, beta = layers_6_self_attn_layer_norm_bias_to_fp16, epsilon = var_579_to_fp16, gamma = layers_6_self_attn_layer_norm_weight_to_fp16, x = input_81_cast_fp16)[name = tensor("x_41_cast_fp16")]; tensor layers_6_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89248640))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(90297280))), name = tensor("layers_6_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_6_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_6_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(90297856)))]; tensor linear_37_cast_fp16 = linear(bias = layers_6_self_attn_q_proj_bias_to_fp16, weight = layers_6_self_attn_q_proj_weight_to_fp16_palettized, x = x_41_cast_fp16)[name = tensor("linear_37_cast_fp16")]; tensor concat_26x = const()[name = tensor("concat_26x"), val = tensor([1, -1, 16, 64])]; tensor var_600_cast_fp16 = reshape(shape = concat_26x, x = linear_37_cast_fp16)[name = tensor("op_600_cast_fp16")]; tensor layers_6_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(90299968))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(91348608))), name = tensor("layers_6_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_6_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_6_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(91349184)))]; tensor linear_38_cast_fp16 = linear(bias = layers_6_self_attn_k_proj_bias_to_fp16, weight = layers_6_self_attn_k_proj_weight_to_fp16_palettized, x = x_41_cast_fp16)[name = tensor("linear_38_cast_fp16")]; tensor concat_27x = const()[name = tensor("concat_27x"), val = tensor([1, -1, 16, 64])]; tensor var_606_cast_fp16 = reshape(shape = concat_27x, x = linear_38_cast_fp16)[name = tensor("op_606_cast_fp16")]; tensor layers_6_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(91351296))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(92399936))), name = tensor("layers_6_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_6_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_6_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(92400512)))]; tensor linear_39_cast_fp16 = linear(bias = layers_6_self_attn_v_proj_bias_to_fp16, weight = layers_6_self_attn_v_proj_weight_to_fp16_palettized, x = x_41_cast_fp16)[name = tensor("linear_39_cast_fp16")]; tensor concat_28x = const()[name = tensor("concat_28x"), val = tensor([1, -1, 16, 64])]; tensor var_612_cast_fp16 = reshape(shape = concat_28x, x = linear_39_cast_fp16)[name = tensor("op_612_cast_fp16")]; tensor v_13_perm_0 = const()[name = tensor("v_13_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_615_transpose_x_0 = const()[name = tensor("op_615_transpose_x_0"), val = tensor(false)]; tensor var_615_transpose_y_0 = const()[name = tensor("op_615_transpose_y_0"), val = tensor(false)]; tensor transpose_108_perm_0 = const()[name = tensor("transpose_108_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_109_perm_0 = const()[name = tensor("transpose_109_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_109 = transpose(perm = transpose_109_perm_0, x = var_606_cast_fp16)[name = tensor("transpose_214")]; tensor transpose_108 = transpose(perm = transpose_108_perm_0, x = var_600_cast_fp16)[name = tensor("transpose_215")]; tensor var_615_cast_fp16 = matmul(transpose_x = var_615_transpose_x_0, transpose_y = var_615_transpose_y_0, x = transpose_108, y = transpose_109)[name = tensor("op_615_cast_fp16")]; tensor var_616_to_fp16 = const()[name = tensor("op_616_to_fp16"), val = tensor(0x1p-3)]; tensor input_83_cast_fp16 = mul(x = var_615_cast_fp16, y = var_616_to_fp16)[name = tensor("input_83_cast_fp16")]; tensor attn_13_cast_fp16 = softmax(axis = var_576, x = input_83_cast_fp16)[name = tensor("attn_13_cast_fp16")]; tensor out_13_transpose_x_0 = const()[name = tensor("out_13_transpose_x_0"), val = tensor(false)]; tensor out_13_transpose_y_0 = const()[name = tensor("out_13_transpose_y_0"), val = tensor(false)]; tensor v_13_cast_fp16 = transpose(perm = v_13_perm_0, x = var_612_cast_fp16)[name = tensor("transpose_213")]; tensor out_13_cast_fp16 = matmul(transpose_x = out_13_transpose_x_0, transpose_y = out_13_transpose_y_0, x = attn_13_cast_fp16, y = v_13_cast_fp16)[name = tensor("out_13_cast_fp16")]; tensor var_620_perm_0 = const()[name = tensor("op_620_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_29x = const()[name = tensor("concat_29x"), val = tensor([1, -1, 1024])]; tensor var_620_cast_fp16 = transpose(perm = var_620_perm_0, x = out_13_cast_fp16)[name = tensor("transpose_212")]; tensor input_85_cast_fp16 = reshape(shape = concat_29x, x = var_620_cast_fp16)[name = tensor("input_85_cast_fp16")]; tensor layers_6_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(92402624))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93451264))), name = tensor("layers_6_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_6_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_6_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93451840)))]; tensor linear_40_cast_fp16 = linear(bias = layers_6_self_attn_out_proj_bias_to_fp16, weight = layers_6_self_attn_out_proj_weight_to_fp16_palettized, x = input_85_cast_fp16)[name = tensor("linear_40_cast_fp16")]; tensor input_87_cast_fp16 = add(x = input_81_cast_fp16, y = linear_40_cast_fp16)[name = tensor("input_87_cast_fp16")]; tensor input_89_axes_0 = const()[name = tensor("input_89_axes_0"), val = tensor([-1])]; tensor layers_6_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_6_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93453952)))]; tensor layers_6_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_6_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93456064)))]; tensor input_89_cast_fp16 = layer_norm(axes = input_89_axes_0, beta = layers_6_final_layer_norm_bias_to_fp16, epsilon = var_579_to_fp16, gamma = layers_6_final_layer_norm_weight_to_fp16, x = input_87_cast_fp16)[name = tensor("input_89_cast_fp16")]; tensor layers_6_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93458176))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(97652544))), name = tensor("layers_6_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_6_fc1_bias_to_fp16 = const()[name = tensor("layers_6_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(97653120)))]; tensor linear_41_cast_fp16 = linear(bias = layers_6_fc1_bias_to_fp16, weight = layers_6_fc1_weight_to_fp16_palettized, x = input_89_cast_fp16)[name = tensor("linear_41_cast_fp16")]; tensor input_91_mode_0 = const()[name = tensor("input_91_mode_0"), val = tensor("EXACT")]; tensor input_91_cast_fp16 = gelu(mode = input_91_mode_0, x = linear_41_cast_fp16)[name = tensor("input_91_cast_fp16")]; tensor layers_6_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(97661376))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(101855744))), name = tensor("layers_6_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_6_fc2_bias_to_fp16 = const()[name = tensor("layers_6_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(101856320)))]; tensor linear_42_cast_fp16 = linear(bias = layers_6_fc2_bias_to_fp16, weight = layers_6_fc2_weight_to_fp16_palettized, x = input_91_cast_fp16)[name = tensor("linear_42_cast_fp16")]; tensor input_93_cast_fp16 = add(x = input_87_cast_fp16, y = linear_42_cast_fp16)[name = tensor("input_93_cast_fp16")]; tensor var_646 = const()[name = tensor("op_646"), val = tensor(-1)]; tensor x_47_axes_0 = const()[name = tensor("x_47_axes_0"), val = tensor([-1])]; tensor layers_7_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_7_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(101858432)))]; tensor layers_7_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_7_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(101860544)))]; tensor var_649_to_fp16 = const()[name = tensor("op_649_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_47_cast_fp16 = layer_norm(axes = x_47_axes_0, beta = layers_7_self_attn_layer_norm_bias_to_fp16, epsilon = var_649_to_fp16, gamma = layers_7_self_attn_layer_norm_weight_to_fp16, x = input_93_cast_fp16)[name = tensor("x_47_cast_fp16")]; tensor layers_7_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(101862656))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102911296))), name = tensor("layers_7_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_7_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_7_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102911872)))]; tensor linear_43_cast_fp16 = linear(bias = layers_7_self_attn_q_proj_bias_to_fp16, weight = layers_7_self_attn_q_proj_weight_to_fp16_palettized, x = x_47_cast_fp16)[name = tensor("linear_43_cast_fp16")]; tensor concat_30x = const()[name = tensor("concat_30x"), val = tensor([1, -1, 16, 64])]; tensor var_670_cast_fp16 = reshape(shape = concat_30x, x = linear_43_cast_fp16)[name = tensor("op_670_cast_fp16")]; tensor layers_7_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102913984))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103962624))), name = tensor("layers_7_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_7_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_7_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103963200)))]; tensor linear_44_cast_fp16 = linear(bias = layers_7_self_attn_k_proj_bias_to_fp16, weight = layers_7_self_attn_k_proj_weight_to_fp16_palettized, x = x_47_cast_fp16)[name = tensor("linear_44_cast_fp16")]; tensor concat_31x = const()[name = tensor("concat_31x"), val = tensor([1, -1, 16, 64])]; tensor var_676_cast_fp16 = reshape(shape = concat_31x, x = linear_44_cast_fp16)[name = tensor("op_676_cast_fp16")]; tensor layers_7_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103965312))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(105013952))), name = tensor("layers_7_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_7_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_7_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(105014528)))]; tensor linear_45_cast_fp16 = linear(bias = layers_7_self_attn_v_proj_bias_to_fp16, weight = layers_7_self_attn_v_proj_weight_to_fp16_palettized, x = x_47_cast_fp16)[name = tensor("linear_45_cast_fp16")]; tensor concat_32x = const()[name = tensor("concat_32x"), val = tensor([1, -1, 16, 64])]; tensor var_682_cast_fp16 = reshape(shape = concat_32x, x = linear_45_cast_fp16)[name = tensor("op_682_cast_fp16")]; tensor v_15_perm_0 = const()[name = tensor("v_15_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_685_transpose_x_0 = const()[name = tensor("op_685_transpose_x_0"), val = tensor(false)]; tensor var_685_transpose_y_0 = const()[name = tensor("op_685_transpose_y_0"), val = tensor(false)]; tensor transpose_110_perm_0 = const()[name = tensor("transpose_110_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_111_perm_0 = const()[name = tensor("transpose_111_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_111 = transpose(perm = transpose_111_perm_0, x = var_676_cast_fp16)[name = tensor("transpose_210")]; tensor transpose_110 = transpose(perm = transpose_110_perm_0, x = var_670_cast_fp16)[name = tensor("transpose_211")]; tensor var_685_cast_fp16 = matmul(transpose_x = var_685_transpose_x_0, transpose_y = var_685_transpose_y_0, x = transpose_110, y = transpose_111)[name = tensor("op_685_cast_fp16")]; tensor var_686_to_fp16 = const()[name = tensor("op_686_to_fp16"), val = tensor(0x1p-3)]; tensor input_95_cast_fp16 = mul(x = var_685_cast_fp16, y = var_686_to_fp16)[name = tensor("input_95_cast_fp16")]; tensor attn_15_cast_fp16 = softmax(axis = var_646, x = input_95_cast_fp16)[name = tensor("attn_15_cast_fp16")]; tensor out_15_transpose_x_0 = const()[name = tensor("out_15_transpose_x_0"), val = tensor(false)]; tensor out_15_transpose_y_0 = const()[name = tensor("out_15_transpose_y_0"), val = tensor(false)]; tensor v_15_cast_fp16 = transpose(perm = v_15_perm_0, x = var_682_cast_fp16)[name = tensor("transpose_209")]; tensor out_15_cast_fp16 = matmul(transpose_x = out_15_transpose_x_0, transpose_y = out_15_transpose_y_0, x = attn_15_cast_fp16, y = v_15_cast_fp16)[name = tensor("out_15_cast_fp16")]; tensor var_690_perm_0 = const()[name = tensor("op_690_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_33x = const()[name = tensor("concat_33x"), val = tensor([1, -1, 1024])]; tensor var_690_cast_fp16 = transpose(perm = var_690_perm_0, x = out_15_cast_fp16)[name = tensor("transpose_208")]; tensor input_97_cast_fp16 = reshape(shape = concat_33x, x = var_690_cast_fp16)[name = tensor("input_97_cast_fp16")]; tensor layers_7_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(105016640))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106065280))), name = tensor("layers_7_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_7_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_7_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106065856)))]; tensor linear_46_cast_fp16 = linear(bias = layers_7_self_attn_out_proj_bias_to_fp16, weight = layers_7_self_attn_out_proj_weight_to_fp16_palettized, x = input_97_cast_fp16)[name = tensor("linear_46_cast_fp16")]; tensor input_99_cast_fp16 = add(x = input_93_cast_fp16, y = linear_46_cast_fp16)[name = tensor("input_99_cast_fp16")]; tensor input_101_axes_0 = const()[name = tensor("input_101_axes_0"), val = tensor([-1])]; tensor layers_7_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_7_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106067968)))]; tensor layers_7_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_7_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106070080)))]; tensor input_101_cast_fp16 = layer_norm(axes = input_101_axes_0, beta = layers_7_final_layer_norm_bias_to_fp16, epsilon = var_649_to_fp16, gamma = layers_7_final_layer_norm_weight_to_fp16, x = input_99_cast_fp16)[name = tensor("input_101_cast_fp16")]; tensor layers_7_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106072192))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110266560))), name = tensor("layers_7_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_7_fc1_bias_to_fp16 = const()[name = tensor("layers_7_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110267136)))]; tensor linear_47_cast_fp16 = linear(bias = layers_7_fc1_bias_to_fp16, weight = layers_7_fc1_weight_to_fp16_palettized, x = input_101_cast_fp16)[name = tensor("linear_47_cast_fp16")]; tensor input_103_mode_0 = const()[name = tensor("input_103_mode_0"), val = tensor("EXACT")]; tensor input_103_cast_fp16 = gelu(mode = input_103_mode_0, x = linear_47_cast_fp16)[name = tensor("input_103_cast_fp16")]; tensor layers_7_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110275392))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114469760))), name = tensor("layers_7_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_7_fc2_bias_to_fp16 = const()[name = tensor("layers_7_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114470336)))]; tensor linear_48_cast_fp16 = linear(bias = layers_7_fc2_bias_to_fp16, weight = layers_7_fc2_weight_to_fp16_palettized, x = input_103_cast_fp16)[name = tensor("linear_48_cast_fp16")]; tensor input_105_cast_fp16 = add(x = input_99_cast_fp16, y = linear_48_cast_fp16)[name = tensor("input_105_cast_fp16")]; tensor var_716 = const()[name = tensor("op_716"), val = tensor(-1)]; tensor x_53_axes_0 = const()[name = tensor("x_53_axes_0"), val = tensor([-1])]; tensor layers_8_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_8_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114472448)))]; tensor layers_8_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_8_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114474560)))]; tensor var_719_to_fp16 = const()[name = tensor("op_719_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_53_cast_fp16 = layer_norm(axes = x_53_axes_0, beta = layers_8_self_attn_layer_norm_bias_to_fp16, epsilon = var_719_to_fp16, gamma = layers_8_self_attn_layer_norm_weight_to_fp16, x = input_105_cast_fp16)[name = tensor("x_53_cast_fp16")]; tensor layers_8_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114476672))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(115525312))), name = tensor("layers_8_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_8_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_8_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(115525888)))]; tensor linear_49_cast_fp16 = linear(bias = layers_8_self_attn_q_proj_bias_to_fp16, weight = layers_8_self_attn_q_proj_weight_to_fp16_palettized, x = x_53_cast_fp16)[name = tensor("linear_49_cast_fp16")]; tensor concat_34x = const()[name = tensor("concat_34x"), val = tensor([1, -1, 16, 64])]; tensor var_740_cast_fp16 = reshape(shape = concat_34x, x = linear_49_cast_fp16)[name = tensor("op_740_cast_fp16")]; tensor layers_8_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(115528000))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(116576640))), name = tensor("layers_8_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_8_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_8_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(116577216)))]; tensor linear_50_cast_fp16 = linear(bias = layers_8_self_attn_k_proj_bias_to_fp16, weight = layers_8_self_attn_k_proj_weight_to_fp16_palettized, x = x_53_cast_fp16)[name = tensor("linear_50_cast_fp16")]; tensor concat_35x = const()[name = tensor("concat_35x"), val = tensor([1, -1, 16, 64])]; tensor var_746_cast_fp16 = reshape(shape = concat_35x, x = linear_50_cast_fp16)[name = tensor("op_746_cast_fp16")]; tensor layers_8_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(116579328))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(117627968))), name = tensor("layers_8_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_8_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_8_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(117628544)))]; tensor linear_51_cast_fp16 = linear(bias = layers_8_self_attn_v_proj_bias_to_fp16, weight = layers_8_self_attn_v_proj_weight_to_fp16_palettized, x = x_53_cast_fp16)[name = tensor("linear_51_cast_fp16")]; tensor concat_36x = const()[name = tensor("concat_36x"), val = tensor([1, -1, 16, 64])]; tensor var_752_cast_fp16 = reshape(shape = concat_36x, x = linear_51_cast_fp16)[name = tensor("op_752_cast_fp16")]; tensor v_17_perm_0 = const()[name = tensor("v_17_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_755_transpose_x_0 = const()[name = tensor("op_755_transpose_x_0"), val = tensor(false)]; tensor var_755_transpose_y_0 = const()[name = tensor("op_755_transpose_y_0"), val = tensor(false)]; tensor transpose_112_perm_0 = const()[name = tensor("transpose_112_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_113_perm_0 = const()[name = tensor("transpose_113_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_113 = transpose(perm = transpose_113_perm_0, x = var_746_cast_fp16)[name = tensor("transpose_206")]; tensor transpose_112 = transpose(perm = transpose_112_perm_0, x = var_740_cast_fp16)[name = tensor("transpose_207")]; tensor var_755_cast_fp16 = matmul(transpose_x = var_755_transpose_x_0, transpose_y = var_755_transpose_y_0, x = transpose_112, y = transpose_113)[name = tensor("op_755_cast_fp16")]; tensor var_756_to_fp16 = const()[name = tensor("op_756_to_fp16"), val = tensor(0x1p-3)]; tensor input_107_cast_fp16 = mul(x = var_755_cast_fp16, y = var_756_to_fp16)[name = tensor("input_107_cast_fp16")]; tensor attn_17_cast_fp16 = softmax(axis = var_716, x = input_107_cast_fp16)[name = tensor("attn_17_cast_fp16")]; tensor out_17_transpose_x_0 = const()[name = tensor("out_17_transpose_x_0"), val = tensor(false)]; tensor out_17_transpose_y_0 = const()[name = tensor("out_17_transpose_y_0"), val = tensor(false)]; tensor v_17_cast_fp16 = transpose(perm = v_17_perm_0, x = var_752_cast_fp16)[name = tensor("transpose_205")]; tensor out_17_cast_fp16 = matmul(transpose_x = out_17_transpose_x_0, transpose_y = out_17_transpose_y_0, x = attn_17_cast_fp16, y = v_17_cast_fp16)[name = tensor("out_17_cast_fp16")]; tensor var_760_perm_0 = const()[name = tensor("op_760_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_37x = const()[name = tensor("concat_37x"), val = tensor([1, -1, 1024])]; tensor var_760_cast_fp16 = transpose(perm = var_760_perm_0, x = out_17_cast_fp16)[name = tensor("transpose_204")]; tensor input_109_cast_fp16 = reshape(shape = concat_37x, x = var_760_cast_fp16)[name = tensor("input_109_cast_fp16")]; tensor layers_8_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(117630656))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118679296))), name = tensor("layers_8_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_8_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_8_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118679872)))]; tensor linear_52_cast_fp16 = linear(bias = layers_8_self_attn_out_proj_bias_to_fp16, weight = layers_8_self_attn_out_proj_weight_to_fp16_palettized, x = input_109_cast_fp16)[name = tensor("linear_52_cast_fp16")]; tensor input_111_cast_fp16 = add(x = input_105_cast_fp16, y = linear_52_cast_fp16)[name = tensor("input_111_cast_fp16")]; tensor input_113_axes_0 = const()[name = tensor("input_113_axes_0"), val = tensor([-1])]; tensor layers_8_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_8_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118681984)))]; tensor layers_8_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_8_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118684096)))]; tensor input_113_cast_fp16 = layer_norm(axes = input_113_axes_0, beta = layers_8_final_layer_norm_bias_to_fp16, epsilon = var_719_to_fp16, gamma = layers_8_final_layer_norm_weight_to_fp16, x = input_111_cast_fp16)[name = tensor("input_113_cast_fp16")]; tensor layers_8_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118686208))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122880576))), name = tensor("layers_8_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_8_fc1_bias_to_fp16 = const()[name = tensor("layers_8_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122881152)))]; tensor linear_53_cast_fp16 = linear(bias = layers_8_fc1_bias_to_fp16, weight = layers_8_fc1_weight_to_fp16_palettized, x = input_113_cast_fp16)[name = tensor("linear_53_cast_fp16")]; tensor input_115_mode_0 = const()[name = tensor("input_115_mode_0"), val = tensor("EXACT")]; tensor input_115_cast_fp16 = gelu(mode = input_115_mode_0, x = linear_53_cast_fp16)[name = tensor("input_115_cast_fp16")]; tensor layers_8_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122889408))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127083776))), name = tensor("layers_8_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_8_fc2_bias_to_fp16 = const()[name = tensor("layers_8_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127084352)))]; tensor linear_54_cast_fp16 = linear(bias = layers_8_fc2_bias_to_fp16, weight = layers_8_fc2_weight_to_fp16_palettized, x = input_115_cast_fp16)[name = tensor("linear_54_cast_fp16")]; tensor input_117_cast_fp16 = add(x = input_111_cast_fp16, y = linear_54_cast_fp16)[name = tensor("input_117_cast_fp16")]; tensor var_786 = const()[name = tensor("op_786"), val = tensor(-1)]; tensor x_59_axes_0 = const()[name = tensor("x_59_axes_0"), val = tensor([-1])]; tensor layers_9_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_9_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127086464)))]; tensor layers_9_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_9_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127088576)))]; tensor var_789_to_fp16 = const()[name = tensor("op_789_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_59_cast_fp16 = layer_norm(axes = x_59_axes_0, beta = layers_9_self_attn_layer_norm_bias_to_fp16, epsilon = var_789_to_fp16, gamma = layers_9_self_attn_layer_norm_weight_to_fp16, x = input_117_cast_fp16)[name = tensor("x_59_cast_fp16")]; tensor layers_9_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127090688))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(128139328))), name = tensor("layers_9_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_9_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_9_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(128139904)))]; tensor linear_55_cast_fp16 = linear(bias = layers_9_self_attn_q_proj_bias_to_fp16, weight = layers_9_self_attn_q_proj_weight_to_fp16_palettized, x = x_59_cast_fp16)[name = tensor("linear_55_cast_fp16")]; tensor concat_38x = const()[name = tensor("concat_38x"), val = tensor([1, -1, 16, 64])]; tensor var_810_cast_fp16 = reshape(shape = concat_38x, x = linear_55_cast_fp16)[name = tensor("op_810_cast_fp16")]; tensor layers_9_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(128142016))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(129190656))), name = tensor("layers_9_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_9_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_9_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(129191232)))]; tensor linear_56_cast_fp16 = linear(bias = layers_9_self_attn_k_proj_bias_to_fp16, weight = layers_9_self_attn_k_proj_weight_to_fp16_palettized, x = x_59_cast_fp16)[name = tensor("linear_56_cast_fp16")]; tensor concat_39x = const()[name = tensor("concat_39x"), val = tensor([1, -1, 16, 64])]; tensor var_816_cast_fp16 = reshape(shape = concat_39x, x = linear_56_cast_fp16)[name = tensor("op_816_cast_fp16")]; tensor layers_9_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(129193344))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(130241984))), name = tensor("layers_9_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_9_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_9_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(130242560)))]; tensor linear_57_cast_fp16 = linear(bias = layers_9_self_attn_v_proj_bias_to_fp16, weight = layers_9_self_attn_v_proj_weight_to_fp16_palettized, x = x_59_cast_fp16)[name = tensor("linear_57_cast_fp16")]; tensor concat_40x = const()[name = tensor("concat_40x"), val = tensor([1, -1, 16, 64])]; tensor var_822_cast_fp16 = reshape(shape = concat_40x, x = linear_57_cast_fp16)[name = tensor("op_822_cast_fp16")]; tensor v_19_perm_0 = const()[name = tensor("v_19_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_825_transpose_x_0 = const()[name = tensor("op_825_transpose_x_0"), val = tensor(false)]; tensor var_825_transpose_y_0 = const()[name = tensor("op_825_transpose_y_0"), val = tensor(false)]; tensor transpose_114_perm_0 = const()[name = tensor("transpose_114_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_115_perm_0 = const()[name = tensor("transpose_115_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_115 = transpose(perm = transpose_115_perm_0, x = var_816_cast_fp16)[name = tensor("transpose_202")]; tensor transpose_114 = transpose(perm = transpose_114_perm_0, x = var_810_cast_fp16)[name = tensor("transpose_203")]; tensor var_825_cast_fp16 = matmul(transpose_x = var_825_transpose_x_0, transpose_y = var_825_transpose_y_0, x = transpose_114, y = transpose_115)[name = tensor("op_825_cast_fp16")]; tensor var_826_to_fp16 = const()[name = tensor("op_826_to_fp16"), val = tensor(0x1p-3)]; tensor input_119_cast_fp16 = mul(x = var_825_cast_fp16, y = var_826_to_fp16)[name = tensor("input_119_cast_fp16")]; tensor attn_19_cast_fp16 = softmax(axis = var_786, x = input_119_cast_fp16)[name = tensor("attn_19_cast_fp16")]; tensor out_19_transpose_x_0 = const()[name = tensor("out_19_transpose_x_0"), val = tensor(false)]; tensor out_19_transpose_y_0 = const()[name = tensor("out_19_transpose_y_0"), val = tensor(false)]; tensor v_19_cast_fp16 = transpose(perm = v_19_perm_0, x = var_822_cast_fp16)[name = tensor("transpose_201")]; tensor out_19_cast_fp16 = matmul(transpose_x = out_19_transpose_x_0, transpose_y = out_19_transpose_y_0, x = attn_19_cast_fp16, y = v_19_cast_fp16)[name = tensor("out_19_cast_fp16")]; tensor var_830_perm_0 = const()[name = tensor("op_830_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_41x = const()[name = tensor("concat_41x"), val = tensor([1, -1, 1024])]; tensor var_830_cast_fp16 = transpose(perm = var_830_perm_0, x = out_19_cast_fp16)[name = tensor("transpose_200")]; tensor input_121_cast_fp16 = reshape(shape = concat_41x, x = var_830_cast_fp16)[name = tensor("input_121_cast_fp16")]; tensor layers_9_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(130244672))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(131293312))), name = tensor("layers_9_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_9_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_9_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(131293888)))]; tensor linear_58_cast_fp16 = linear(bias = layers_9_self_attn_out_proj_bias_to_fp16, weight = layers_9_self_attn_out_proj_weight_to_fp16_palettized, x = input_121_cast_fp16)[name = tensor("linear_58_cast_fp16")]; tensor input_123_cast_fp16 = add(x = input_117_cast_fp16, y = linear_58_cast_fp16)[name = tensor("input_123_cast_fp16")]; tensor input_125_axes_0 = const()[name = tensor("input_125_axes_0"), val = tensor([-1])]; tensor layers_9_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_9_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(131296000)))]; tensor layers_9_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_9_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(131298112)))]; tensor input_125_cast_fp16 = layer_norm(axes = input_125_axes_0, beta = layers_9_final_layer_norm_bias_to_fp16, epsilon = var_789_to_fp16, gamma = layers_9_final_layer_norm_weight_to_fp16, x = input_123_cast_fp16)[name = tensor("input_125_cast_fp16")]; tensor layers_9_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(131300224))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135494592))), name = tensor("layers_9_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_9_fc1_bias_to_fp16 = const()[name = tensor("layers_9_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135495168)))]; tensor linear_59_cast_fp16 = linear(bias = layers_9_fc1_bias_to_fp16, weight = layers_9_fc1_weight_to_fp16_palettized, x = input_125_cast_fp16)[name = tensor("linear_59_cast_fp16")]; tensor input_127_mode_0 = const()[name = tensor("input_127_mode_0"), val = tensor("EXACT")]; tensor input_127_cast_fp16 = gelu(mode = input_127_mode_0, x = linear_59_cast_fp16)[name = tensor("input_127_cast_fp16")]; tensor layers_9_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135503424))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139697792))), name = tensor("layers_9_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_9_fc2_bias_to_fp16 = const()[name = tensor("layers_9_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139698368)))]; tensor linear_60_cast_fp16 = linear(bias = layers_9_fc2_bias_to_fp16, weight = layers_9_fc2_weight_to_fp16_palettized, x = input_127_cast_fp16)[name = tensor("linear_60_cast_fp16")]; tensor input_129_cast_fp16 = add(x = input_123_cast_fp16, y = linear_60_cast_fp16)[name = tensor("input_129_cast_fp16")]; tensor var_856 = const()[name = tensor("op_856"), val = tensor(-1)]; tensor x_65_axes_0 = const()[name = tensor("x_65_axes_0"), val = tensor([-1])]; tensor layers_10_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_10_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139700480)))]; tensor layers_10_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_10_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139702592)))]; tensor var_859_to_fp16 = const()[name = tensor("op_859_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_65_cast_fp16 = layer_norm(axes = x_65_axes_0, beta = layers_10_self_attn_layer_norm_bias_to_fp16, epsilon = var_859_to_fp16, gamma = layers_10_self_attn_layer_norm_weight_to_fp16, x = input_129_cast_fp16)[name = tensor("x_65_cast_fp16")]; tensor layers_10_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139704704))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(140753344))), name = tensor("layers_10_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_10_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_10_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(140753920)))]; tensor linear_61_cast_fp16 = linear(bias = layers_10_self_attn_q_proj_bias_to_fp16, weight = layers_10_self_attn_q_proj_weight_to_fp16_palettized, x = x_65_cast_fp16)[name = tensor("linear_61_cast_fp16")]; tensor concat_42x = const()[name = tensor("concat_42x"), val = tensor([1, -1, 16, 64])]; tensor var_880_cast_fp16 = reshape(shape = concat_42x, x = linear_61_cast_fp16)[name = tensor("op_880_cast_fp16")]; tensor layers_10_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(140756032))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141804672))), name = tensor("layers_10_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_10_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_10_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141805248)))]; tensor linear_62_cast_fp16 = linear(bias = layers_10_self_attn_k_proj_bias_to_fp16, weight = layers_10_self_attn_k_proj_weight_to_fp16_palettized, x = x_65_cast_fp16)[name = tensor("linear_62_cast_fp16")]; tensor concat_43x = const()[name = tensor("concat_43x"), val = tensor([1, -1, 16, 64])]; tensor var_886_cast_fp16 = reshape(shape = concat_43x, x = linear_62_cast_fp16)[name = tensor("op_886_cast_fp16")]; tensor layers_10_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141807360))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(142856000))), name = tensor("layers_10_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_10_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_10_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(142856576)))]; tensor linear_63_cast_fp16 = linear(bias = layers_10_self_attn_v_proj_bias_to_fp16, weight = layers_10_self_attn_v_proj_weight_to_fp16_palettized, x = x_65_cast_fp16)[name = tensor("linear_63_cast_fp16")]; tensor concat_44x = const()[name = tensor("concat_44x"), val = tensor([1, -1, 16, 64])]; tensor var_892_cast_fp16 = reshape(shape = concat_44x, x = linear_63_cast_fp16)[name = tensor("op_892_cast_fp16")]; tensor v_21_perm_0 = const()[name = tensor("v_21_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_895_transpose_x_0 = const()[name = tensor("op_895_transpose_x_0"), val = tensor(false)]; tensor var_895_transpose_y_0 = const()[name = tensor("op_895_transpose_y_0"), val = tensor(false)]; tensor transpose_116_perm_0 = const()[name = tensor("transpose_116_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_117_perm_0 = const()[name = tensor("transpose_117_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_117 = transpose(perm = transpose_117_perm_0, x = var_886_cast_fp16)[name = tensor("transpose_198")]; tensor transpose_116 = transpose(perm = transpose_116_perm_0, x = var_880_cast_fp16)[name = tensor("transpose_199")]; tensor var_895_cast_fp16 = matmul(transpose_x = var_895_transpose_x_0, transpose_y = var_895_transpose_y_0, x = transpose_116, y = transpose_117)[name = tensor("op_895_cast_fp16")]; tensor var_896_to_fp16 = const()[name = tensor("op_896_to_fp16"), val = tensor(0x1p-3)]; tensor input_131_cast_fp16 = mul(x = var_895_cast_fp16, y = var_896_to_fp16)[name = tensor("input_131_cast_fp16")]; tensor attn_21_cast_fp16 = softmax(axis = var_856, x = input_131_cast_fp16)[name = tensor("attn_21_cast_fp16")]; tensor out_21_transpose_x_0 = const()[name = tensor("out_21_transpose_x_0"), val = tensor(false)]; tensor out_21_transpose_y_0 = const()[name = tensor("out_21_transpose_y_0"), val = tensor(false)]; tensor v_21_cast_fp16 = transpose(perm = v_21_perm_0, x = var_892_cast_fp16)[name = tensor("transpose_197")]; tensor out_21_cast_fp16 = matmul(transpose_x = out_21_transpose_x_0, transpose_y = out_21_transpose_y_0, x = attn_21_cast_fp16, y = v_21_cast_fp16)[name = tensor("out_21_cast_fp16")]; tensor var_900_perm_0 = const()[name = tensor("op_900_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_45x = const()[name = tensor("concat_45x"), val = tensor([1, -1, 1024])]; tensor var_900_cast_fp16 = transpose(perm = var_900_perm_0, x = out_21_cast_fp16)[name = tensor("transpose_196")]; tensor input_133_cast_fp16 = reshape(shape = concat_45x, x = var_900_cast_fp16)[name = tensor("input_133_cast_fp16")]; tensor layers_10_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(142858688))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(143907328))), name = tensor("layers_10_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_10_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_10_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(143907904)))]; tensor linear_64_cast_fp16 = linear(bias = layers_10_self_attn_out_proj_bias_to_fp16, weight = layers_10_self_attn_out_proj_weight_to_fp16_palettized, x = input_133_cast_fp16)[name = tensor("linear_64_cast_fp16")]; tensor input_135_cast_fp16 = add(x = input_129_cast_fp16, y = linear_64_cast_fp16)[name = tensor("input_135_cast_fp16")]; tensor input_137_axes_0 = const()[name = tensor("input_137_axes_0"), val = tensor([-1])]; tensor layers_10_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_10_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(143910016)))]; tensor layers_10_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_10_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(143912128)))]; tensor input_137_cast_fp16 = layer_norm(axes = input_137_axes_0, beta = layers_10_final_layer_norm_bias_to_fp16, epsilon = var_859_to_fp16, gamma = layers_10_final_layer_norm_weight_to_fp16, x = input_135_cast_fp16)[name = tensor("input_137_cast_fp16")]; tensor layers_10_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(143914240))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148108608))), name = tensor("layers_10_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_10_fc1_bias_to_fp16 = const()[name = tensor("layers_10_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148109184)))]; tensor linear_65_cast_fp16 = linear(bias = layers_10_fc1_bias_to_fp16, weight = layers_10_fc1_weight_to_fp16_palettized, x = input_137_cast_fp16)[name = tensor("linear_65_cast_fp16")]; tensor input_139_mode_0 = const()[name = tensor("input_139_mode_0"), val = tensor("EXACT")]; tensor input_139_cast_fp16 = gelu(mode = input_139_mode_0, x = linear_65_cast_fp16)[name = tensor("input_139_cast_fp16")]; tensor layers_10_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148117440))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(152311808))), name = tensor("layers_10_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_10_fc2_bias_to_fp16 = const()[name = tensor("layers_10_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(152312384)))]; tensor linear_66_cast_fp16 = linear(bias = layers_10_fc2_bias_to_fp16, weight = layers_10_fc2_weight_to_fp16_palettized, x = input_139_cast_fp16)[name = tensor("linear_66_cast_fp16")]; tensor input_141_cast_fp16 = add(x = input_135_cast_fp16, y = linear_66_cast_fp16)[name = tensor("input_141_cast_fp16")]; tensor var_926 = const()[name = tensor("op_926"), val = tensor(-1)]; tensor x_71_axes_0 = const()[name = tensor("x_71_axes_0"), val = tensor([-1])]; tensor layers_11_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_11_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(152314496)))]; tensor layers_11_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_11_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(152316608)))]; tensor var_929_to_fp16 = const()[name = tensor("op_929_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_71_cast_fp16 = layer_norm(axes = x_71_axes_0, beta = layers_11_self_attn_layer_norm_bias_to_fp16, epsilon = var_929_to_fp16, gamma = layers_11_self_attn_layer_norm_weight_to_fp16, x = input_141_cast_fp16)[name = tensor("x_71_cast_fp16")]; tensor layers_11_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(152318720))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(153367360))), name = tensor("layers_11_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_11_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_11_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(153367936)))]; tensor linear_67_cast_fp16 = linear(bias = layers_11_self_attn_q_proj_bias_to_fp16, weight = layers_11_self_attn_q_proj_weight_to_fp16_palettized, x = x_71_cast_fp16)[name = tensor("linear_67_cast_fp16")]; tensor concat_46x = const()[name = tensor("concat_46x"), val = tensor([1, -1, 16, 64])]; tensor var_950_cast_fp16 = reshape(shape = concat_46x, x = linear_67_cast_fp16)[name = tensor("op_950_cast_fp16")]; tensor layers_11_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(153370048))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(154418688))), name = tensor("layers_11_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_11_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_11_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(154419264)))]; tensor linear_68_cast_fp16 = linear(bias = layers_11_self_attn_k_proj_bias_to_fp16, weight = layers_11_self_attn_k_proj_weight_to_fp16_palettized, x = x_71_cast_fp16)[name = tensor("linear_68_cast_fp16")]; tensor concat_47x = const()[name = tensor("concat_47x"), val = tensor([1, -1, 16, 64])]; tensor var_956_cast_fp16 = reshape(shape = concat_47x, x = linear_68_cast_fp16)[name = tensor("op_956_cast_fp16")]; tensor layers_11_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(154421376))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(155470016))), name = tensor("layers_11_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_11_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_11_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(155470592)))]; tensor linear_69_cast_fp16 = linear(bias = layers_11_self_attn_v_proj_bias_to_fp16, weight = layers_11_self_attn_v_proj_weight_to_fp16_palettized, x = x_71_cast_fp16)[name = tensor("linear_69_cast_fp16")]; tensor concat_48x = const()[name = tensor("concat_48x"), val = tensor([1, -1, 16, 64])]; tensor var_962_cast_fp16 = reshape(shape = concat_48x, x = linear_69_cast_fp16)[name = tensor("op_962_cast_fp16")]; tensor v_23_perm_0 = const()[name = tensor("v_23_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_965_transpose_x_0 = const()[name = tensor("op_965_transpose_x_0"), val = tensor(false)]; tensor var_965_transpose_y_0 = const()[name = tensor("op_965_transpose_y_0"), val = tensor(false)]; tensor transpose_118_perm_0 = const()[name = tensor("transpose_118_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_119_perm_0 = const()[name = tensor("transpose_119_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_119 = transpose(perm = transpose_119_perm_0, x = var_956_cast_fp16)[name = tensor("transpose_194")]; tensor transpose_118 = transpose(perm = transpose_118_perm_0, x = var_950_cast_fp16)[name = tensor("transpose_195")]; tensor var_965_cast_fp16 = matmul(transpose_x = var_965_transpose_x_0, transpose_y = var_965_transpose_y_0, x = transpose_118, y = transpose_119)[name = tensor("op_965_cast_fp16")]; tensor var_966_to_fp16 = const()[name = tensor("op_966_to_fp16"), val = tensor(0x1p-3)]; tensor input_143_cast_fp16 = mul(x = var_965_cast_fp16, y = var_966_to_fp16)[name = tensor("input_143_cast_fp16")]; tensor attn_23_cast_fp16 = softmax(axis = var_926, x = input_143_cast_fp16)[name = tensor("attn_23_cast_fp16")]; tensor out_23_transpose_x_0 = const()[name = tensor("out_23_transpose_x_0"), val = tensor(false)]; tensor out_23_transpose_y_0 = const()[name = tensor("out_23_transpose_y_0"), val = tensor(false)]; tensor v_23_cast_fp16 = transpose(perm = v_23_perm_0, x = var_962_cast_fp16)[name = tensor("transpose_193")]; tensor out_23_cast_fp16 = matmul(transpose_x = out_23_transpose_x_0, transpose_y = out_23_transpose_y_0, x = attn_23_cast_fp16, y = v_23_cast_fp16)[name = tensor("out_23_cast_fp16")]; tensor var_970_perm_0 = const()[name = tensor("op_970_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_49x = const()[name = tensor("concat_49x"), val = tensor([1, -1, 1024])]; tensor var_970_cast_fp16 = transpose(perm = var_970_perm_0, x = out_23_cast_fp16)[name = tensor("transpose_192")]; tensor input_145_cast_fp16 = reshape(shape = concat_49x, x = var_970_cast_fp16)[name = tensor("input_145_cast_fp16")]; tensor layers_11_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(155472704))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(156521344))), name = tensor("layers_11_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_11_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_11_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(156521920)))]; tensor linear_70_cast_fp16 = linear(bias = layers_11_self_attn_out_proj_bias_to_fp16, weight = layers_11_self_attn_out_proj_weight_to_fp16_palettized, x = input_145_cast_fp16)[name = tensor("linear_70_cast_fp16")]; tensor input_147_cast_fp16 = add(x = input_141_cast_fp16, y = linear_70_cast_fp16)[name = tensor("input_147_cast_fp16")]; tensor input_149_axes_0 = const()[name = tensor("input_149_axes_0"), val = tensor([-1])]; tensor layers_11_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_11_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(156524032)))]; tensor layers_11_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_11_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(156526144)))]; tensor input_149_cast_fp16 = layer_norm(axes = input_149_axes_0, beta = layers_11_final_layer_norm_bias_to_fp16, epsilon = var_929_to_fp16, gamma = layers_11_final_layer_norm_weight_to_fp16, x = input_147_cast_fp16)[name = tensor("input_149_cast_fp16")]; tensor layers_11_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(156528256))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160722624))), name = tensor("layers_11_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_11_fc1_bias_to_fp16 = const()[name = tensor("layers_11_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160723200)))]; tensor linear_71_cast_fp16 = linear(bias = layers_11_fc1_bias_to_fp16, weight = layers_11_fc1_weight_to_fp16_palettized, x = input_149_cast_fp16)[name = tensor("linear_71_cast_fp16")]; tensor input_151_mode_0 = const()[name = tensor("input_151_mode_0"), val = tensor("EXACT")]; tensor input_151_cast_fp16 = gelu(mode = input_151_mode_0, x = linear_71_cast_fp16)[name = tensor("input_151_cast_fp16")]; tensor layers_11_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(160731456))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164925824))), name = tensor("layers_11_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_11_fc2_bias_to_fp16 = const()[name = tensor("layers_11_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164926400)))]; tensor linear_72_cast_fp16 = linear(bias = layers_11_fc2_bias_to_fp16, weight = layers_11_fc2_weight_to_fp16_palettized, x = input_151_cast_fp16)[name = tensor("linear_72_cast_fp16")]; tensor input_153_cast_fp16 = add(x = input_147_cast_fp16, y = linear_72_cast_fp16)[name = tensor("input_153_cast_fp16")]; tensor var_996 = const()[name = tensor("op_996"), val = tensor(-1)]; tensor x_77_axes_0 = const()[name = tensor("x_77_axes_0"), val = tensor([-1])]; tensor layers_12_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_12_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164928512)))]; tensor layers_12_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_12_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164930624)))]; tensor var_999_to_fp16 = const()[name = tensor("op_999_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_77_cast_fp16 = layer_norm(axes = x_77_axes_0, beta = layers_12_self_attn_layer_norm_bias_to_fp16, epsilon = var_999_to_fp16, gamma = layers_12_self_attn_layer_norm_weight_to_fp16, x = input_153_cast_fp16)[name = tensor("x_77_cast_fp16")]; tensor layers_12_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164932736))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165981376))), name = tensor("layers_12_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_12_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_12_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165981952)))]; tensor linear_73_cast_fp16 = linear(bias = layers_12_self_attn_q_proj_bias_to_fp16, weight = layers_12_self_attn_q_proj_weight_to_fp16_palettized, x = x_77_cast_fp16)[name = tensor("linear_73_cast_fp16")]; tensor concat_50x = const()[name = tensor("concat_50x"), val = tensor([1, -1, 16, 64])]; tensor var_1020_cast_fp16 = reshape(shape = concat_50x, x = linear_73_cast_fp16)[name = tensor("op_1020_cast_fp16")]; tensor layers_12_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165984064))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167032704))), name = tensor("layers_12_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_12_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_12_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167033280)))]; tensor linear_74_cast_fp16 = linear(bias = layers_12_self_attn_k_proj_bias_to_fp16, weight = layers_12_self_attn_k_proj_weight_to_fp16_palettized, x = x_77_cast_fp16)[name = tensor("linear_74_cast_fp16")]; tensor concat_51x = const()[name = tensor("concat_51x"), val = tensor([1, -1, 16, 64])]; tensor var_1026_cast_fp16 = reshape(shape = concat_51x, x = linear_74_cast_fp16)[name = tensor("op_1026_cast_fp16")]; tensor layers_12_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167035392))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(168084032))), name = tensor("layers_12_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_12_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_12_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(168084608)))]; tensor linear_75_cast_fp16 = linear(bias = layers_12_self_attn_v_proj_bias_to_fp16, weight = layers_12_self_attn_v_proj_weight_to_fp16_palettized, x = x_77_cast_fp16)[name = tensor("linear_75_cast_fp16")]; tensor concat_52x = const()[name = tensor("concat_52x"), val = tensor([1, -1, 16, 64])]; tensor var_1032_cast_fp16 = reshape(shape = concat_52x, x = linear_75_cast_fp16)[name = tensor("op_1032_cast_fp16")]; tensor v_25_perm_0 = const()[name = tensor("v_25_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1035_transpose_x_0 = const()[name = tensor("op_1035_transpose_x_0"), val = tensor(false)]; tensor var_1035_transpose_y_0 = const()[name = tensor("op_1035_transpose_y_0"), val = tensor(false)]; tensor transpose_120_perm_0 = const()[name = tensor("transpose_120_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_121_perm_0 = const()[name = tensor("transpose_121_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_121 = transpose(perm = transpose_121_perm_0, x = var_1026_cast_fp16)[name = tensor("transpose_190")]; tensor transpose_120 = transpose(perm = transpose_120_perm_0, x = var_1020_cast_fp16)[name = tensor("transpose_191")]; tensor var_1035_cast_fp16 = matmul(transpose_x = var_1035_transpose_x_0, transpose_y = var_1035_transpose_y_0, x = transpose_120, y = transpose_121)[name = tensor("op_1035_cast_fp16")]; tensor var_1036_to_fp16 = const()[name = tensor("op_1036_to_fp16"), val = tensor(0x1p-3)]; tensor input_155_cast_fp16 = mul(x = var_1035_cast_fp16, y = var_1036_to_fp16)[name = tensor("input_155_cast_fp16")]; tensor attn_25_cast_fp16 = softmax(axis = var_996, x = input_155_cast_fp16)[name = tensor("attn_25_cast_fp16")]; tensor out_25_transpose_x_0 = const()[name = tensor("out_25_transpose_x_0"), val = tensor(false)]; tensor out_25_transpose_y_0 = const()[name = tensor("out_25_transpose_y_0"), val = tensor(false)]; tensor v_25_cast_fp16 = transpose(perm = v_25_perm_0, x = var_1032_cast_fp16)[name = tensor("transpose_189")]; tensor out_25_cast_fp16 = matmul(transpose_x = out_25_transpose_x_0, transpose_y = out_25_transpose_y_0, x = attn_25_cast_fp16, y = v_25_cast_fp16)[name = tensor("out_25_cast_fp16")]; tensor var_1040_perm_0 = const()[name = tensor("op_1040_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_53x = const()[name = tensor("concat_53x"), val = tensor([1, -1, 1024])]; tensor var_1040_cast_fp16 = transpose(perm = var_1040_perm_0, x = out_25_cast_fp16)[name = tensor("transpose_188")]; tensor input_157_cast_fp16 = reshape(shape = concat_53x, x = var_1040_cast_fp16)[name = tensor("input_157_cast_fp16")]; tensor layers_12_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(168086720))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169135360))), name = tensor("layers_12_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_12_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_12_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169135936)))]; tensor linear_76_cast_fp16 = linear(bias = layers_12_self_attn_out_proj_bias_to_fp16, weight = layers_12_self_attn_out_proj_weight_to_fp16_palettized, x = input_157_cast_fp16)[name = tensor("linear_76_cast_fp16")]; tensor input_159_cast_fp16 = add(x = input_153_cast_fp16, y = linear_76_cast_fp16)[name = tensor("input_159_cast_fp16")]; tensor input_161_axes_0 = const()[name = tensor("input_161_axes_0"), val = tensor([-1])]; tensor layers_12_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_12_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169138048)))]; tensor layers_12_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_12_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169140160)))]; tensor input_161_cast_fp16 = layer_norm(axes = input_161_axes_0, beta = layers_12_final_layer_norm_bias_to_fp16, epsilon = var_999_to_fp16, gamma = layers_12_final_layer_norm_weight_to_fp16, x = input_159_cast_fp16)[name = tensor("input_161_cast_fp16")]; tensor layers_12_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169142272))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(173336640))), name = tensor("layers_12_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_12_fc1_bias_to_fp16 = const()[name = tensor("layers_12_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(173337216)))]; tensor linear_77_cast_fp16 = linear(bias = layers_12_fc1_bias_to_fp16, weight = layers_12_fc1_weight_to_fp16_palettized, x = input_161_cast_fp16)[name = tensor("linear_77_cast_fp16")]; tensor input_163_mode_0 = const()[name = tensor("input_163_mode_0"), val = tensor("EXACT")]; tensor input_163_cast_fp16 = gelu(mode = input_163_mode_0, x = linear_77_cast_fp16)[name = tensor("input_163_cast_fp16")]; tensor layers_12_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(173345472))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177539840))), name = tensor("layers_12_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_12_fc2_bias_to_fp16 = const()[name = tensor("layers_12_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177540416)))]; tensor linear_78_cast_fp16 = linear(bias = layers_12_fc2_bias_to_fp16, weight = layers_12_fc2_weight_to_fp16_palettized, x = input_163_cast_fp16)[name = tensor("linear_78_cast_fp16")]; tensor input_165_cast_fp16 = add(x = input_159_cast_fp16, y = linear_78_cast_fp16)[name = tensor("input_165_cast_fp16")]; tensor var_1066 = const()[name = tensor("op_1066"), val = tensor(-1)]; tensor x_83_axes_0 = const()[name = tensor("x_83_axes_0"), val = tensor([-1])]; tensor layers_13_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_13_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177542528)))]; tensor layers_13_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_13_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177544640)))]; tensor var_1069_to_fp16 = const()[name = tensor("op_1069_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_83_cast_fp16 = layer_norm(axes = x_83_axes_0, beta = layers_13_self_attn_layer_norm_bias_to_fp16, epsilon = var_1069_to_fp16, gamma = layers_13_self_attn_layer_norm_weight_to_fp16, x = input_165_cast_fp16)[name = tensor("x_83_cast_fp16")]; tensor layers_13_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177546752))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178595392))), name = tensor("layers_13_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_13_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_13_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178595968)))]; tensor linear_79_cast_fp16 = linear(bias = layers_13_self_attn_q_proj_bias_to_fp16, weight = layers_13_self_attn_q_proj_weight_to_fp16_palettized, x = x_83_cast_fp16)[name = tensor("linear_79_cast_fp16")]; tensor concat_54x = const()[name = tensor("concat_54x"), val = tensor([1, -1, 16, 64])]; tensor var_1090_cast_fp16 = reshape(shape = concat_54x, x = linear_79_cast_fp16)[name = tensor("op_1090_cast_fp16")]; tensor layers_13_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178598080))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(179646720))), name = tensor("layers_13_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_13_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_13_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(179647296)))]; tensor linear_80_cast_fp16 = linear(bias = layers_13_self_attn_k_proj_bias_to_fp16, weight = layers_13_self_attn_k_proj_weight_to_fp16_palettized, x = x_83_cast_fp16)[name = tensor("linear_80_cast_fp16")]; tensor concat_55x = const()[name = tensor("concat_55x"), val = tensor([1, -1, 16, 64])]; tensor var_1096_cast_fp16 = reshape(shape = concat_55x, x = linear_80_cast_fp16)[name = tensor("op_1096_cast_fp16")]; tensor layers_13_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(179649408))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180698048))), name = tensor("layers_13_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_13_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_13_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180698624)))]; tensor linear_81_cast_fp16 = linear(bias = layers_13_self_attn_v_proj_bias_to_fp16, weight = layers_13_self_attn_v_proj_weight_to_fp16_palettized, x = x_83_cast_fp16)[name = tensor("linear_81_cast_fp16")]; tensor concat_56x = const()[name = tensor("concat_56x"), val = tensor([1, -1, 16, 64])]; tensor var_1102_cast_fp16 = reshape(shape = concat_56x, x = linear_81_cast_fp16)[name = tensor("op_1102_cast_fp16")]; tensor v_27_perm_0 = const()[name = tensor("v_27_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1105_transpose_x_0 = const()[name = tensor("op_1105_transpose_x_0"), val = tensor(false)]; tensor var_1105_transpose_y_0 = const()[name = tensor("op_1105_transpose_y_0"), val = tensor(false)]; tensor transpose_122_perm_0 = const()[name = tensor("transpose_122_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_123_perm_0 = const()[name = tensor("transpose_123_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_123 = transpose(perm = transpose_123_perm_0, x = var_1096_cast_fp16)[name = tensor("transpose_186")]; tensor transpose_122 = transpose(perm = transpose_122_perm_0, x = var_1090_cast_fp16)[name = tensor("transpose_187")]; tensor var_1105_cast_fp16 = matmul(transpose_x = var_1105_transpose_x_0, transpose_y = var_1105_transpose_y_0, x = transpose_122, y = transpose_123)[name = tensor("op_1105_cast_fp16")]; tensor var_1106_to_fp16 = const()[name = tensor("op_1106_to_fp16"), val = tensor(0x1p-3)]; tensor input_167_cast_fp16 = mul(x = var_1105_cast_fp16, y = var_1106_to_fp16)[name = tensor("input_167_cast_fp16")]; tensor attn_27_cast_fp16 = softmax(axis = var_1066, x = input_167_cast_fp16)[name = tensor("attn_27_cast_fp16")]; tensor out_27_transpose_x_0 = const()[name = tensor("out_27_transpose_x_0"), val = tensor(false)]; tensor out_27_transpose_y_0 = const()[name = tensor("out_27_transpose_y_0"), val = tensor(false)]; tensor v_27_cast_fp16 = transpose(perm = v_27_perm_0, x = var_1102_cast_fp16)[name = tensor("transpose_185")]; tensor out_27_cast_fp16 = matmul(transpose_x = out_27_transpose_x_0, transpose_y = out_27_transpose_y_0, x = attn_27_cast_fp16, y = v_27_cast_fp16)[name = tensor("out_27_cast_fp16")]; tensor var_1110_perm_0 = const()[name = tensor("op_1110_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_57x = const()[name = tensor("concat_57x"), val = tensor([1, -1, 1024])]; tensor var_1110_cast_fp16 = transpose(perm = var_1110_perm_0, x = out_27_cast_fp16)[name = tensor("transpose_184")]; tensor input_169_cast_fp16 = reshape(shape = concat_57x, x = var_1110_cast_fp16)[name = tensor("input_169_cast_fp16")]; tensor layers_13_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180700736))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181749376))), name = tensor("layers_13_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_13_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_13_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181749952)))]; tensor linear_82_cast_fp16 = linear(bias = layers_13_self_attn_out_proj_bias_to_fp16, weight = layers_13_self_attn_out_proj_weight_to_fp16_palettized, x = input_169_cast_fp16)[name = tensor("linear_82_cast_fp16")]; tensor input_171_cast_fp16 = add(x = input_165_cast_fp16, y = linear_82_cast_fp16)[name = tensor("input_171_cast_fp16")]; tensor input_173_axes_0 = const()[name = tensor("input_173_axes_0"), val = tensor([-1])]; tensor layers_13_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_13_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181752064)))]; tensor layers_13_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_13_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181754176)))]; tensor input_173_cast_fp16 = layer_norm(axes = input_173_axes_0, beta = layers_13_final_layer_norm_bias_to_fp16, epsilon = var_1069_to_fp16, gamma = layers_13_final_layer_norm_weight_to_fp16, x = input_171_cast_fp16)[name = tensor("input_173_cast_fp16")]; tensor layers_13_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181756288))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185950656))), name = tensor("layers_13_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_13_fc1_bias_to_fp16 = const()[name = tensor("layers_13_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185951232)))]; tensor linear_83_cast_fp16 = linear(bias = layers_13_fc1_bias_to_fp16, weight = layers_13_fc1_weight_to_fp16_palettized, x = input_173_cast_fp16)[name = tensor("linear_83_cast_fp16")]; tensor input_175_mode_0 = const()[name = tensor("input_175_mode_0"), val = tensor("EXACT")]; tensor input_175_cast_fp16 = gelu(mode = input_175_mode_0, x = linear_83_cast_fp16)[name = tensor("input_175_cast_fp16")]; tensor layers_13_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185959488))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190153856))), name = tensor("layers_13_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_13_fc2_bias_to_fp16 = const()[name = tensor("layers_13_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190154432)))]; tensor linear_84_cast_fp16 = linear(bias = layers_13_fc2_bias_to_fp16, weight = layers_13_fc2_weight_to_fp16_palettized, x = input_175_cast_fp16)[name = tensor("linear_84_cast_fp16")]; tensor input_177_cast_fp16 = add(x = input_171_cast_fp16, y = linear_84_cast_fp16)[name = tensor("input_177_cast_fp16")]; tensor var_1136 = const()[name = tensor("op_1136"), val = tensor(-1)]; tensor x_89_axes_0 = const()[name = tensor("x_89_axes_0"), val = tensor([-1])]; tensor layers_14_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_14_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190156544)))]; tensor layers_14_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_14_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190158656)))]; tensor var_1139_to_fp16 = const()[name = tensor("op_1139_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_89_cast_fp16 = layer_norm(axes = x_89_axes_0, beta = layers_14_self_attn_layer_norm_bias_to_fp16, epsilon = var_1139_to_fp16, gamma = layers_14_self_attn_layer_norm_weight_to_fp16, x = input_177_cast_fp16)[name = tensor("x_89_cast_fp16")]; tensor layers_14_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190160768))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(191209408))), name = tensor("layers_14_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_14_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_14_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(191209984)))]; tensor linear_85_cast_fp16 = linear(bias = layers_14_self_attn_q_proj_bias_to_fp16, weight = layers_14_self_attn_q_proj_weight_to_fp16_palettized, x = x_89_cast_fp16)[name = tensor("linear_85_cast_fp16")]; tensor concat_58x = const()[name = tensor("concat_58x"), val = tensor([1, -1, 16, 64])]; tensor var_1160_cast_fp16 = reshape(shape = concat_58x, x = linear_85_cast_fp16)[name = tensor("op_1160_cast_fp16")]; tensor layers_14_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(191212096))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192260736))), name = tensor("layers_14_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_14_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_14_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192261312)))]; tensor linear_86_cast_fp16 = linear(bias = layers_14_self_attn_k_proj_bias_to_fp16, weight = layers_14_self_attn_k_proj_weight_to_fp16_palettized, x = x_89_cast_fp16)[name = tensor("linear_86_cast_fp16")]; tensor concat_59x = const()[name = tensor("concat_59x"), val = tensor([1, -1, 16, 64])]; tensor var_1166_cast_fp16 = reshape(shape = concat_59x, x = linear_86_cast_fp16)[name = tensor("op_1166_cast_fp16")]; tensor layers_14_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192263424))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(193312064))), name = tensor("layers_14_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_14_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_14_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(193312640)))]; tensor linear_87_cast_fp16 = linear(bias = layers_14_self_attn_v_proj_bias_to_fp16, weight = layers_14_self_attn_v_proj_weight_to_fp16_palettized, x = x_89_cast_fp16)[name = tensor("linear_87_cast_fp16")]; tensor concat_60x = const()[name = tensor("concat_60x"), val = tensor([1, -1, 16, 64])]; tensor var_1172_cast_fp16 = reshape(shape = concat_60x, x = linear_87_cast_fp16)[name = tensor("op_1172_cast_fp16")]; tensor v_29_perm_0 = const()[name = tensor("v_29_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1175_transpose_x_0 = const()[name = tensor("op_1175_transpose_x_0"), val = tensor(false)]; tensor var_1175_transpose_y_0 = const()[name = tensor("op_1175_transpose_y_0"), val = tensor(false)]; tensor transpose_124_perm_0 = const()[name = tensor("transpose_124_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_125_perm_0 = const()[name = tensor("transpose_125_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_125 = transpose(perm = transpose_125_perm_0, x = var_1166_cast_fp16)[name = tensor("transpose_182")]; tensor transpose_124 = transpose(perm = transpose_124_perm_0, x = var_1160_cast_fp16)[name = tensor("transpose_183")]; tensor var_1175_cast_fp16 = matmul(transpose_x = var_1175_transpose_x_0, transpose_y = var_1175_transpose_y_0, x = transpose_124, y = transpose_125)[name = tensor("op_1175_cast_fp16")]; tensor var_1176_to_fp16 = const()[name = tensor("op_1176_to_fp16"), val = tensor(0x1p-3)]; tensor input_179_cast_fp16 = mul(x = var_1175_cast_fp16, y = var_1176_to_fp16)[name = tensor("input_179_cast_fp16")]; tensor attn_29_cast_fp16 = softmax(axis = var_1136, x = input_179_cast_fp16)[name = tensor("attn_29_cast_fp16")]; tensor out_29_transpose_x_0 = const()[name = tensor("out_29_transpose_x_0"), val = tensor(false)]; tensor out_29_transpose_y_0 = const()[name = tensor("out_29_transpose_y_0"), val = tensor(false)]; tensor v_29_cast_fp16 = transpose(perm = v_29_perm_0, x = var_1172_cast_fp16)[name = tensor("transpose_181")]; tensor out_29_cast_fp16 = matmul(transpose_x = out_29_transpose_x_0, transpose_y = out_29_transpose_y_0, x = attn_29_cast_fp16, y = v_29_cast_fp16)[name = tensor("out_29_cast_fp16")]; tensor var_1180_perm_0 = const()[name = tensor("op_1180_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_61x = const()[name = tensor("concat_61x"), val = tensor([1, -1, 1024])]; tensor var_1180_cast_fp16 = transpose(perm = var_1180_perm_0, x = out_29_cast_fp16)[name = tensor("transpose_180")]; tensor input_181_cast_fp16 = reshape(shape = concat_61x, x = var_1180_cast_fp16)[name = tensor("input_181_cast_fp16")]; tensor layers_14_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(193314752))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194363392))), name = tensor("layers_14_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_14_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_14_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194363968)))]; tensor linear_88_cast_fp16 = linear(bias = layers_14_self_attn_out_proj_bias_to_fp16, weight = layers_14_self_attn_out_proj_weight_to_fp16_palettized, x = input_181_cast_fp16)[name = tensor("linear_88_cast_fp16")]; tensor input_183_cast_fp16 = add(x = input_177_cast_fp16, y = linear_88_cast_fp16)[name = tensor("input_183_cast_fp16")]; tensor input_185_axes_0 = const()[name = tensor("input_185_axes_0"), val = tensor([-1])]; tensor layers_14_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_14_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194366080)))]; tensor layers_14_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_14_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194368192)))]; tensor input_185_cast_fp16 = layer_norm(axes = input_185_axes_0, beta = layers_14_final_layer_norm_bias_to_fp16, epsilon = var_1139_to_fp16, gamma = layers_14_final_layer_norm_weight_to_fp16, x = input_183_cast_fp16)[name = tensor("input_185_cast_fp16")]; tensor layers_14_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194370304))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198564672))), name = tensor("layers_14_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_14_fc1_bias_to_fp16 = const()[name = tensor("layers_14_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198565248)))]; tensor linear_89_cast_fp16 = linear(bias = layers_14_fc1_bias_to_fp16, weight = layers_14_fc1_weight_to_fp16_palettized, x = input_185_cast_fp16)[name = tensor("linear_89_cast_fp16")]; tensor input_187_mode_0 = const()[name = tensor("input_187_mode_0"), val = tensor("EXACT")]; tensor input_187_cast_fp16 = gelu(mode = input_187_mode_0, x = linear_89_cast_fp16)[name = tensor("input_187_cast_fp16")]; tensor layers_14_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198573504))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202767872))), name = tensor("layers_14_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_14_fc2_bias_to_fp16 = const()[name = tensor("layers_14_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202768448)))]; tensor linear_90_cast_fp16 = linear(bias = layers_14_fc2_bias_to_fp16, weight = layers_14_fc2_weight_to_fp16_palettized, x = input_187_cast_fp16)[name = tensor("linear_90_cast_fp16")]; tensor input_189_cast_fp16 = add(x = input_183_cast_fp16, y = linear_90_cast_fp16)[name = tensor("input_189_cast_fp16")]; tensor var_1206 = const()[name = tensor("op_1206"), val = tensor(-1)]; tensor x_95_axes_0 = const()[name = tensor("x_95_axes_0"), val = tensor([-1])]; tensor layers_15_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_15_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202770560)))]; tensor layers_15_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_15_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202772672)))]; tensor var_1209_to_fp16 = const()[name = tensor("op_1209_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_95_cast_fp16 = layer_norm(axes = x_95_axes_0, beta = layers_15_self_attn_layer_norm_bias_to_fp16, epsilon = var_1209_to_fp16, gamma = layers_15_self_attn_layer_norm_weight_to_fp16, x = input_189_cast_fp16)[name = tensor("x_95_cast_fp16")]; tensor layers_15_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202774784))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(203823424))), name = tensor("layers_15_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_15_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_15_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(203824000)))]; tensor linear_91_cast_fp16 = linear(bias = layers_15_self_attn_q_proj_bias_to_fp16, weight = layers_15_self_attn_q_proj_weight_to_fp16_palettized, x = x_95_cast_fp16)[name = tensor("linear_91_cast_fp16")]; tensor concat_62x = const()[name = tensor("concat_62x"), val = tensor([1, -1, 16, 64])]; tensor var_1230_cast_fp16 = reshape(shape = concat_62x, x = linear_91_cast_fp16)[name = tensor("op_1230_cast_fp16")]; tensor layers_15_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(203826112))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(204874752))), name = tensor("layers_15_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_15_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_15_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(204875328)))]; tensor linear_92_cast_fp16 = linear(bias = layers_15_self_attn_k_proj_bias_to_fp16, weight = layers_15_self_attn_k_proj_weight_to_fp16_palettized, x = x_95_cast_fp16)[name = tensor("linear_92_cast_fp16")]; tensor concat_63x = const()[name = tensor("concat_63x"), val = tensor([1, -1, 16, 64])]; tensor var_1236_cast_fp16 = reshape(shape = concat_63x, x = linear_92_cast_fp16)[name = tensor("op_1236_cast_fp16")]; tensor layers_15_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(204877440))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(205926080))), name = tensor("layers_15_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_15_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_15_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(205926656)))]; tensor linear_93_cast_fp16 = linear(bias = layers_15_self_attn_v_proj_bias_to_fp16, weight = layers_15_self_attn_v_proj_weight_to_fp16_palettized, x = x_95_cast_fp16)[name = tensor("linear_93_cast_fp16")]; tensor concat_64x = const()[name = tensor("concat_64x"), val = tensor([1, -1, 16, 64])]; tensor var_1242_cast_fp16 = reshape(shape = concat_64x, x = linear_93_cast_fp16)[name = tensor("op_1242_cast_fp16")]; tensor v_31_perm_0 = const()[name = tensor("v_31_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1245_transpose_x_0 = const()[name = tensor("op_1245_transpose_x_0"), val = tensor(false)]; tensor var_1245_transpose_y_0 = const()[name = tensor("op_1245_transpose_y_0"), val = tensor(false)]; tensor transpose_126_perm_0 = const()[name = tensor("transpose_126_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_127_perm_0 = const()[name = tensor("transpose_127_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_127 = transpose(perm = transpose_127_perm_0, x = var_1236_cast_fp16)[name = tensor("transpose_178")]; tensor transpose_126 = transpose(perm = transpose_126_perm_0, x = var_1230_cast_fp16)[name = tensor("transpose_179")]; tensor var_1245_cast_fp16 = matmul(transpose_x = var_1245_transpose_x_0, transpose_y = var_1245_transpose_y_0, x = transpose_126, y = transpose_127)[name = tensor("op_1245_cast_fp16")]; tensor var_1246_to_fp16 = const()[name = tensor("op_1246_to_fp16"), val = tensor(0x1p-3)]; tensor input_191_cast_fp16 = mul(x = var_1245_cast_fp16, y = var_1246_to_fp16)[name = tensor("input_191_cast_fp16")]; tensor attn_31_cast_fp16 = softmax(axis = var_1206, x = input_191_cast_fp16)[name = tensor("attn_31_cast_fp16")]; tensor out_31_transpose_x_0 = const()[name = tensor("out_31_transpose_x_0"), val = tensor(false)]; tensor out_31_transpose_y_0 = const()[name = tensor("out_31_transpose_y_0"), val = tensor(false)]; tensor v_31_cast_fp16 = transpose(perm = v_31_perm_0, x = var_1242_cast_fp16)[name = tensor("transpose_177")]; tensor out_31_cast_fp16 = matmul(transpose_x = out_31_transpose_x_0, transpose_y = out_31_transpose_y_0, x = attn_31_cast_fp16, y = v_31_cast_fp16)[name = tensor("out_31_cast_fp16")]; tensor var_1250_perm_0 = const()[name = tensor("op_1250_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_65x = const()[name = tensor("concat_65x"), val = tensor([1, -1, 1024])]; tensor var_1250_cast_fp16 = transpose(perm = var_1250_perm_0, x = out_31_cast_fp16)[name = tensor("transpose_176")]; tensor input_193_cast_fp16 = reshape(shape = concat_65x, x = var_1250_cast_fp16)[name = tensor("input_193_cast_fp16")]; tensor layers_15_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(205928768))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(206977408))), name = tensor("layers_15_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_15_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_15_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(206977984)))]; tensor linear_94_cast_fp16 = linear(bias = layers_15_self_attn_out_proj_bias_to_fp16, weight = layers_15_self_attn_out_proj_weight_to_fp16_palettized, x = input_193_cast_fp16)[name = tensor("linear_94_cast_fp16")]; tensor input_195_cast_fp16 = add(x = input_189_cast_fp16, y = linear_94_cast_fp16)[name = tensor("input_195_cast_fp16")]; tensor input_197_axes_0 = const()[name = tensor("input_197_axes_0"), val = tensor([-1])]; tensor layers_15_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_15_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(206980096)))]; tensor layers_15_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_15_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(206982208)))]; tensor input_197_cast_fp16 = layer_norm(axes = input_197_axes_0, beta = layers_15_final_layer_norm_bias_to_fp16, epsilon = var_1209_to_fp16, gamma = layers_15_final_layer_norm_weight_to_fp16, x = input_195_cast_fp16)[name = tensor("input_197_cast_fp16")]; tensor layers_15_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(206984320))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211178688))), name = tensor("layers_15_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_15_fc1_bias_to_fp16 = const()[name = tensor("layers_15_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211179264)))]; tensor linear_95_cast_fp16 = linear(bias = layers_15_fc1_bias_to_fp16, weight = layers_15_fc1_weight_to_fp16_palettized, x = input_197_cast_fp16)[name = tensor("linear_95_cast_fp16")]; tensor input_199_mode_0 = const()[name = tensor("input_199_mode_0"), val = tensor("EXACT")]; tensor input_199_cast_fp16 = gelu(mode = input_199_mode_0, x = linear_95_cast_fp16)[name = tensor("input_199_cast_fp16")]; tensor layers_15_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211187520))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215381888))), name = tensor("layers_15_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_15_fc2_bias_to_fp16 = const()[name = tensor("layers_15_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215382464)))]; tensor linear_96_cast_fp16 = linear(bias = layers_15_fc2_bias_to_fp16, weight = layers_15_fc2_weight_to_fp16_palettized, x = input_199_cast_fp16)[name = tensor("linear_96_cast_fp16")]; tensor input_201_cast_fp16 = add(x = input_195_cast_fp16, y = linear_96_cast_fp16)[name = tensor("input_201_cast_fp16")]; tensor var_1276 = const()[name = tensor("op_1276"), val = tensor(-1)]; tensor x_101_axes_0 = const()[name = tensor("x_101_axes_0"), val = tensor([-1])]; tensor layers_16_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_16_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215384576)))]; tensor layers_16_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_16_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215386688)))]; tensor var_1279_to_fp16 = const()[name = tensor("op_1279_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_101_cast_fp16 = layer_norm(axes = x_101_axes_0, beta = layers_16_self_attn_layer_norm_bias_to_fp16, epsilon = var_1279_to_fp16, gamma = layers_16_self_attn_layer_norm_weight_to_fp16, x = input_201_cast_fp16)[name = tensor("x_101_cast_fp16")]; tensor layers_16_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215388800))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(216437440))), name = tensor("layers_16_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_16_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_16_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(216438016)))]; tensor linear_97_cast_fp16 = linear(bias = layers_16_self_attn_q_proj_bias_to_fp16, weight = layers_16_self_attn_q_proj_weight_to_fp16_palettized, x = x_101_cast_fp16)[name = tensor("linear_97_cast_fp16")]; tensor concat_66x = const()[name = tensor("concat_66x"), val = tensor([1, -1, 16, 64])]; tensor var_1300_cast_fp16 = reshape(shape = concat_66x, x = linear_97_cast_fp16)[name = tensor("op_1300_cast_fp16")]; tensor layers_16_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(216440128))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217488768))), name = tensor("layers_16_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_16_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_16_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217489344)))]; tensor linear_98_cast_fp16 = linear(bias = layers_16_self_attn_k_proj_bias_to_fp16, weight = layers_16_self_attn_k_proj_weight_to_fp16_palettized, x = x_101_cast_fp16)[name = tensor("linear_98_cast_fp16")]; tensor concat_67x = const()[name = tensor("concat_67x"), val = tensor([1, -1, 16, 64])]; tensor var_1306_cast_fp16 = reshape(shape = concat_67x, x = linear_98_cast_fp16)[name = tensor("op_1306_cast_fp16")]; tensor layers_16_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217491456))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218540096))), name = tensor("layers_16_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_16_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_16_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218540672)))]; tensor linear_99_cast_fp16 = linear(bias = layers_16_self_attn_v_proj_bias_to_fp16, weight = layers_16_self_attn_v_proj_weight_to_fp16_palettized, x = x_101_cast_fp16)[name = tensor("linear_99_cast_fp16")]; tensor concat_68x = const()[name = tensor("concat_68x"), val = tensor([1, -1, 16, 64])]; tensor var_1312_cast_fp16 = reshape(shape = concat_68x, x = linear_99_cast_fp16)[name = tensor("op_1312_cast_fp16")]; tensor v_33_perm_0 = const()[name = tensor("v_33_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1315_transpose_x_0 = const()[name = tensor("op_1315_transpose_x_0"), val = tensor(false)]; tensor var_1315_transpose_y_0 = const()[name = tensor("op_1315_transpose_y_0"), val = tensor(false)]; tensor transpose_128_perm_0 = const()[name = tensor("transpose_128_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_129_perm_0 = const()[name = tensor("transpose_129_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_129 = transpose(perm = transpose_129_perm_0, x = var_1306_cast_fp16)[name = tensor("transpose_174")]; tensor transpose_128 = transpose(perm = transpose_128_perm_0, x = var_1300_cast_fp16)[name = tensor("transpose_175")]; tensor var_1315_cast_fp16 = matmul(transpose_x = var_1315_transpose_x_0, transpose_y = var_1315_transpose_y_0, x = transpose_128, y = transpose_129)[name = tensor("op_1315_cast_fp16")]; tensor var_1316_to_fp16 = const()[name = tensor("op_1316_to_fp16"), val = tensor(0x1p-3)]; tensor input_203_cast_fp16 = mul(x = var_1315_cast_fp16, y = var_1316_to_fp16)[name = tensor("input_203_cast_fp16")]; tensor attn_33_cast_fp16 = softmax(axis = var_1276, x = input_203_cast_fp16)[name = tensor("attn_33_cast_fp16")]; tensor out_33_transpose_x_0 = const()[name = tensor("out_33_transpose_x_0"), val = tensor(false)]; tensor out_33_transpose_y_0 = const()[name = tensor("out_33_transpose_y_0"), val = tensor(false)]; tensor v_33_cast_fp16 = transpose(perm = v_33_perm_0, x = var_1312_cast_fp16)[name = tensor("transpose_173")]; tensor out_33_cast_fp16 = matmul(transpose_x = out_33_transpose_x_0, transpose_y = out_33_transpose_y_0, x = attn_33_cast_fp16, y = v_33_cast_fp16)[name = tensor("out_33_cast_fp16")]; tensor var_1320_perm_0 = const()[name = tensor("op_1320_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_69x = const()[name = tensor("concat_69x"), val = tensor([1, -1, 1024])]; tensor var_1320_cast_fp16 = transpose(perm = var_1320_perm_0, x = out_33_cast_fp16)[name = tensor("transpose_172")]; tensor input_205_cast_fp16 = reshape(shape = concat_69x, x = var_1320_cast_fp16)[name = tensor("input_205_cast_fp16")]; tensor layers_16_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218542784))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219591424))), name = tensor("layers_16_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_16_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_16_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219592000)))]; tensor linear_100_cast_fp16 = linear(bias = layers_16_self_attn_out_proj_bias_to_fp16, weight = layers_16_self_attn_out_proj_weight_to_fp16_palettized, x = input_205_cast_fp16)[name = tensor("linear_100_cast_fp16")]; tensor input_207_cast_fp16 = add(x = input_201_cast_fp16, y = linear_100_cast_fp16)[name = tensor("input_207_cast_fp16")]; tensor input_209_axes_0 = const()[name = tensor("input_209_axes_0"), val = tensor([-1])]; tensor layers_16_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_16_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219594112)))]; tensor layers_16_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_16_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219596224)))]; tensor input_209_cast_fp16 = layer_norm(axes = input_209_axes_0, beta = layers_16_final_layer_norm_bias_to_fp16, epsilon = var_1279_to_fp16, gamma = layers_16_final_layer_norm_weight_to_fp16, x = input_207_cast_fp16)[name = tensor("input_209_cast_fp16")]; tensor layers_16_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219598336))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(223792704))), name = tensor("layers_16_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_16_fc1_bias_to_fp16 = const()[name = tensor("layers_16_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(223793280)))]; tensor linear_101_cast_fp16 = linear(bias = layers_16_fc1_bias_to_fp16, weight = layers_16_fc1_weight_to_fp16_palettized, x = input_209_cast_fp16)[name = tensor("linear_101_cast_fp16")]; tensor input_211_mode_0 = const()[name = tensor("input_211_mode_0"), val = tensor("EXACT")]; tensor input_211_cast_fp16 = gelu(mode = input_211_mode_0, x = linear_101_cast_fp16)[name = tensor("input_211_cast_fp16")]; tensor layers_16_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(223801536))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(227995904))), name = tensor("layers_16_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_16_fc2_bias_to_fp16 = const()[name = tensor("layers_16_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(227996480)))]; tensor linear_102_cast_fp16 = linear(bias = layers_16_fc2_bias_to_fp16, weight = layers_16_fc2_weight_to_fp16_palettized, x = input_211_cast_fp16)[name = tensor("linear_102_cast_fp16")]; tensor input_213_cast_fp16 = add(x = input_207_cast_fp16, y = linear_102_cast_fp16)[name = tensor("input_213_cast_fp16")]; tensor var_1346 = const()[name = tensor("op_1346"), val = tensor(-1)]; tensor x_107_axes_0 = const()[name = tensor("x_107_axes_0"), val = tensor([-1])]; tensor layers_17_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_17_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(227998592)))]; tensor layers_17_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_17_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(228000704)))]; tensor var_1349_to_fp16 = const()[name = tensor("op_1349_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_107_cast_fp16 = layer_norm(axes = x_107_axes_0, beta = layers_17_self_attn_layer_norm_bias_to_fp16, epsilon = var_1349_to_fp16, gamma = layers_17_self_attn_layer_norm_weight_to_fp16, x = input_213_cast_fp16)[name = tensor("x_107_cast_fp16")]; tensor layers_17_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(228002816))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(229051456))), name = tensor("layers_17_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_17_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_17_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(229052032)))]; tensor linear_103_cast_fp16 = linear(bias = layers_17_self_attn_q_proj_bias_to_fp16, weight = layers_17_self_attn_q_proj_weight_to_fp16_palettized, x = x_107_cast_fp16)[name = tensor("linear_103_cast_fp16")]; tensor concat_70x = const()[name = tensor("concat_70x"), val = tensor([1, -1, 16, 64])]; tensor var_1370_cast_fp16 = reshape(shape = concat_70x, x = linear_103_cast_fp16)[name = tensor("op_1370_cast_fp16")]; tensor layers_17_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(229054144))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(230102784))), name = tensor("layers_17_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_17_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_17_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(230103360)))]; tensor linear_104_cast_fp16 = linear(bias = layers_17_self_attn_k_proj_bias_to_fp16, weight = layers_17_self_attn_k_proj_weight_to_fp16_palettized, x = x_107_cast_fp16)[name = tensor("linear_104_cast_fp16")]; tensor concat_71x = const()[name = tensor("concat_71x"), val = tensor([1, -1, 16, 64])]; tensor var_1376_cast_fp16 = reshape(shape = concat_71x, x = linear_104_cast_fp16)[name = tensor("op_1376_cast_fp16")]; tensor layers_17_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(230105472))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(231154112))), name = tensor("layers_17_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_17_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_17_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(231154688)))]; tensor linear_105_cast_fp16 = linear(bias = layers_17_self_attn_v_proj_bias_to_fp16, weight = layers_17_self_attn_v_proj_weight_to_fp16_palettized, x = x_107_cast_fp16)[name = tensor("linear_105_cast_fp16")]; tensor concat_72x = const()[name = tensor("concat_72x"), val = tensor([1, -1, 16, 64])]; tensor var_1382_cast_fp16 = reshape(shape = concat_72x, x = linear_105_cast_fp16)[name = tensor("op_1382_cast_fp16")]; tensor v_35_perm_0 = const()[name = tensor("v_35_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1385_transpose_x_0 = const()[name = tensor("op_1385_transpose_x_0"), val = tensor(false)]; tensor var_1385_transpose_y_0 = const()[name = tensor("op_1385_transpose_y_0"), val = tensor(false)]; tensor transpose_130_perm_0 = const()[name = tensor("transpose_130_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_131_perm_0 = const()[name = tensor("transpose_131_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_131 = transpose(perm = transpose_131_perm_0, x = var_1376_cast_fp16)[name = tensor("transpose_170")]; tensor transpose_130 = transpose(perm = transpose_130_perm_0, x = var_1370_cast_fp16)[name = tensor("transpose_171")]; tensor var_1385_cast_fp16 = matmul(transpose_x = var_1385_transpose_x_0, transpose_y = var_1385_transpose_y_0, x = transpose_130, y = transpose_131)[name = tensor("op_1385_cast_fp16")]; tensor var_1386_to_fp16 = const()[name = tensor("op_1386_to_fp16"), val = tensor(0x1p-3)]; tensor input_215_cast_fp16 = mul(x = var_1385_cast_fp16, y = var_1386_to_fp16)[name = tensor("input_215_cast_fp16")]; tensor attn_35_cast_fp16 = softmax(axis = var_1346, x = input_215_cast_fp16)[name = tensor("attn_35_cast_fp16")]; tensor out_35_transpose_x_0 = const()[name = tensor("out_35_transpose_x_0"), val = tensor(false)]; tensor out_35_transpose_y_0 = const()[name = tensor("out_35_transpose_y_0"), val = tensor(false)]; tensor v_35_cast_fp16 = transpose(perm = v_35_perm_0, x = var_1382_cast_fp16)[name = tensor("transpose_169")]; tensor out_35_cast_fp16 = matmul(transpose_x = out_35_transpose_x_0, transpose_y = out_35_transpose_y_0, x = attn_35_cast_fp16, y = v_35_cast_fp16)[name = tensor("out_35_cast_fp16")]; tensor var_1390_perm_0 = const()[name = tensor("op_1390_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_73x = const()[name = tensor("concat_73x"), val = tensor([1, -1, 1024])]; tensor var_1390_cast_fp16 = transpose(perm = var_1390_perm_0, x = out_35_cast_fp16)[name = tensor("transpose_168")]; tensor input_217_cast_fp16 = reshape(shape = concat_73x, x = var_1390_cast_fp16)[name = tensor("input_217_cast_fp16")]; tensor layers_17_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(231156800))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(232205440))), name = tensor("layers_17_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_17_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_17_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(232206016)))]; tensor linear_106_cast_fp16 = linear(bias = layers_17_self_attn_out_proj_bias_to_fp16, weight = layers_17_self_attn_out_proj_weight_to_fp16_palettized, x = input_217_cast_fp16)[name = tensor("linear_106_cast_fp16")]; tensor input_219_cast_fp16 = add(x = input_213_cast_fp16, y = linear_106_cast_fp16)[name = tensor("input_219_cast_fp16")]; tensor input_221_axes_0 = const()[name = tensor("input_221_axes_0"), val = tensor([-1])]; tensor layers_17_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_17_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(232208128)))]; tensor layers_17_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_17_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(232210240)))]; tensor input_221_cast_fp16 = layer_norm(axes = input_221_axes_0, beta = layers_17_final_layer_norm_bias_to_fp16, epsilon = var_1349_to_fp16, gamma = layers_17_final_layer_norm_weight_to_fp16, x = input_219_cast_fp16)[name = tensor("input_221_cast_fp16")]; tensor layers_17_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(232212352))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236406720))), name = tensor("layers_17_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_17_fc1_bias_to_fp16 = const()[name = tensor("layers_17_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236407296)))]; tensor linear_107_cast_fp16 = linear(bias = layers_17_fc1_bias_to_fp16, weight = layers_17_fc1_weight_to_fp16_palettized, x = input_221_cast_fp16)[name = tensor("linear_107_cast_fp16")]; tensor input_223_mode_0 = const()[name = tensor("input_223_mode_0"), val = tensor("EXACT")]; tensor input_223_cast_fp16 = gelu(mode = input_223_mode_0, x = linear_107_cast_fp16)[name = tensor("input_223_cast_fp16")]; tensor layers_17_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236415552))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240609920))), name = tensor("layers_17_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_17_fc2_bias_to_fp16 = const()[name = tensor("layers_17_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240610496)))]; tensor linear_108_cast_fp16 = linear(bias = layers_17_fc2_bias_to_fp16, weight = layers_17_fc2_weight_to_fp16_palettized, x = input_223_cast_fp16)[name = tensor("linear_108_cast_fp16")]; tensor input_225_cast_fp16 = add(x = input_219_cast_fp16, y = linear_108_cast_fp16)[name = tensor("input_225_cast_fp16")]; tensor var_1416 = const()[name = tensor("op_1416"), val = tensor(-1)]; tensor x_113_axes_0 = const()[name = tensor("x_113_axes_0"), val = tensor([-1])]; tensor layers_18_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_18_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240612608)))]; tensor layers_18_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_18_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240614720)))]; tensor var_1419_to_fp16 = const()[name = tensor("op_1419_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_113_cast_fp16 = layer_norm(axes = x_113_axes_0, beta = layers_18_self_attn_layer_norm_bias_to_fp16, epsilon = var_1419_to_fp16, gamma = layers_18_self_attn_layer_norm_weight_to_fp16, x = input_225_cast_fp16)[name = tensor("x_113_cast_fp16")]; tensor layers_18_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240616832))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(241665472))), name = tensor("layers_18_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_18_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_18_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(241666048)))]; tensor linear_109_cast_fp16 = linear(bias = layers_18_self_attn_q_proj_bias_to_fp16, weight = layers_18_self_attn_q_proj_weight_to_fp16_palettized, x = x_113_cast_fp16)[name = tensor("linear_109_cast_fp16")]; tensor concat_74x = const()[name = tensor("concat_74x"), val = tensor([1, -1, 16, 64])]; tensor var_1440_cast_fp16 = reshape(shape = concat_74x, x = linear_109_cast_fp16)[name = tensor("op_1440_cast_fp16")]; tensor layers_18_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(241668160))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(242716800))), name = tensor("layers_18_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_18_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_18_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(242717376)))]; tensor linear_110_cast_fp16 = linear(bias = layers_18_self_attn_k_proj_bias_to_fp16, weight = layers_18_self_attn_k_proj_weight_to_fp16_palettized, x = x_113_cast_fp16)[name = tensor("linear_110_cast_fp16")]; tensor concat_75x = const()[name = tensor("concat_75x"), val = tensor([1, -1, 16, 64])]; tensor var_1446_cast_fp16 = reshape(shape = concat_75x, x = linear_110_cast_fp16)[name = tensor("op_1446_cast_fp16")]; tensor layers_18_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(242719488))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(243768128))), name = tensor("layers_18_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_18_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_18_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(243768704)))]; tensor linear_111_cast_fp16 = linear(bias = layers_18_self_attn_v_proj_bias_to_fp16, weight = layers_18_self_attn_v_proj_weight_to_fp16_palettized, x = x_113_cast_fp16)[name = tensor("linear_111_cast_fp16")]; tensor concat_76x = const()[name = tensor("concat_76x"), val = tensor([1, -1, 16, 64])]; tensor var_1452_cast_fp16 = reshape(shape = concat_76x, x = linear_111_cast_fp16)[name = tensor("op_1452_cast_fp16")]; tensor v_37_perm_0 = const()[name = tensor("v_37_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1455_transpose_x_0 = const()[name = tensor("op_1455_transpose_x_0"), val = tensor(false)]; tensor var_1455_transpose_y_0 = const()[name = tensor("op_1455_transpose_y_0"), val = tensor(false)]; tensor transpose_132_perm_0 = const()[name = tensor("transpose_132_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_133_perm_0 = const()[name = tensor("transpose_133_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_133 = transpose(perm = transpose_133_perm_0, x = var_1446_cast_fp16)[name = tensor("transpose_166")]; tensor transpose_132 = transpose(perm = transpose_132_perm_0, x = var_1440_cast_fp16)[name = tensor("transpose_167")]; tensor var_1455_cast_fp16 = matmul(transpose_x = var_1455_transpose_x_0, transpose_y = var_1455_transpose_y_0, x = transpose_132, y = transpose_133)[name = tensor("op_1455_cast_fp16")]; tensor var_1456_to_fp16 = const()[name = tensor("op_1456_to_fp16"), val = tensor(0x1p-3)]; tensor input_227_cast_fp16 = mul(x = var_1455_cast_fp16, y = var_1456_to_fp16)[name = tensor("input_227_cast_fp16")]; tensor attn_37_cast_fp16 = softmax(axis = var_1416, x = input_227_cast_fp16)[name = tensor("attn_37_cast_fp16")]; tensor out_37_transpose_x_0 = const()[name = tensor("out_37_transpose_x_0"), val = tensor(false)]; tensor out_37_transpose_y_0 = const()[name = tensor("out_37_transpose_y_0"), val = tensor(false)]; tensor v_37_cast_fp16 = transpose(perm = v_37_perm_0, x = var_1452_cast_fp16)[name = tensor("transpose_165")]; tensor out_37_cast_fp16 = matmul(transpose_x = out_37_transpose_x_0, transpose_y = out_37_transpose_y_0, x = attn_37_cast_fp16, y = v_37_cast_fp16)[name = tensor("out_37_cast_fp16")]; tensor var_1460_perm_0 = const()[name = tensor("op_1460_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_77x = const()[name = tensor("concat_77x"), val = tensor([1, -1, 1024])]; tensor var_1460_cast_fp16 = transpose(perm = var_1460_perm_0, x = out_37_cast_fp16)[name = tensor("transpose_164")]; tensor input_229_cast_fp16 = reshape(shape = concat_77x, x = var_1460_cast_fp16)[name = tensor("input_229_cast_fp16")]; tensor layers_18_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(243770816))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(244819456))), name = tensor("layers_18_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_18_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_18_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(244820032)))]; tensor linear_112_cast_fp16 = linear(bias = layers_18_self_attn_out_proj_bias_to_fp16, weight = layers_18_self_attn_out_proj_weight_to_fp16_palettized, x = input_229_cast_fp16)[name = tensor("linear_112_cast_fp16")]; tensor input_231_cast_fp16 = add(x = input_225_cast_fp16, y = linear_112_cast_fp16)[name = tensor("input_231_cast_fp16")]; tensor input_233_axes_0 = const()[name = tensor("input_233_axes_0"), val = tensor([-1])]; tensor layers_18_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_18_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(244822144)))]; tensor layers_18_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_18_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(244824256)))]; tensor input_233_cast_fp16 = layer_norm(axes = input_233_axes_0, beta = layers_18_final_layer_norm_bias_to_fp16, epsilon = var_1419_to_fp16, gamma = layers_18_final_layer_norm_weight_to_fp16, x = input_231_cast_fp16)[name = tensor("input_233_cast_fp16")]; tensor layers_18_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(244826368))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(249020736))), name = tensor("layers_18_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_18_fc1_bias_to_fp16 = const()[name = tensor("layers_18_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(249021312)))]; tensor linear_113_cast_fp16 = linear(bias = layers_18_fc1_bias_to_fp16, weight = layers_18_fc1_weight_to_fp16_palettized, x = input_233_cast_fp16)[name = tensor("linear_113_cast_fp16")]; tensor input_235_mode_0 = const()[name = tensor("input_235_mode_0"), val = tensor("EXACT")]; tensor input_235_cast_fp16 = gelu(mode = input_235_mode_0, x = linear_113_cast_fp16)[name = tensor("input_235_cast_fp16")]; tensor layers_18_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(249029568))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253223936))), name = tensor("layers_18_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_18_fc2_bias_to_fp16 = const()[name = tensor("layers_18_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253224512)))]; tensor linear_114_cast_fp16 = linear(bias = layers_18_fc2_bias_to_fp16, weight = layers_18_fc2_weight_to_fp16_palettized, x = input_235_cast_fp16)[name = tensor("linear_114_cast_fp16")]; tensor input_237_cast_fp16 = add(x = input_231_cast_fp16, y = linear_114_cast_fp16)[name = tensor("input_237_cast_fp16")]; tensor var_1486 = const()[name = tensor("op_1486"), val = tensor(-1)]; tensor x_119_axes_0 = const()[name = tensor("x_119_axes_0"), val = tensor([-1])]; tensor layers_19_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_19_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253226624)))]; tensor layers_19_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_19_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253228736)))]; tensor var_1489_to_fp16 = const()[name = tensor("op_1489_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_119_cast_fp16 = layer_norm(axes = x_119_axes_0, beta = layers_19_self_attn_layer_norm_bias_to_fp16, epsilon = var_1489_to_fp16, gamma = layers_19_self_attn_layer_norm_weight_to_fp16, x = input_237_cast_fp16)[name = tensor("x_119_cast_fp16")]; tensor layers_19_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253230848))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(254279488))), name = tensor("layers_19_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_19_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_19_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(254280064)))]; tensor linear_115_cast_fp16 = linear(bias = layers_19_self_attn_q_proj_bias_to_fp16, weight = layers_19_self_attn_q_proj_weight_to_fp16_palettized, x = x_119_cast_fp16)[name = tensor("linear_115_cast_fp16")]; tensor concat_78x = const()[name = tensor("concat_78x"), val = tensor([1, -1, 16, 64])]; tensor var_1510_cast_fp16 = reshape(shape = concat_78x, x = linear_115_cast_fp16)[name = tensor("op_1510_cast_fp16")]; tensor layers_19_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(254282176))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255330816))), name = tensor("layers_19_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_19_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_19_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255331392)))]; tensor linear_116_cast_fp16 = linear(bias = layers_19_self_attn_k_proj_bias_to_fp16, weight = layers_19_self_attn_k_proj_weight_to_fp16_palettized, x = x_119_cast_fp16)[name = tensor("linear_116_cast_fp16")]; tensor concat_79x = const()[name = tensor("concat_79x"), val = tensor([1, -1, 16, 64])]; tensor var_1516_cast_fp16 = reshape(shape = concat_79x, x = linear_116_cast_fp16)[name = tensor("op_1516_cast_fp16")]; tensor layers_19_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255333504))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(256382144))), name = tensor("layers_19_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_19_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_19_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(256382720)))]; tensor linear_117_cast_fp16 = linear(bias = layers_19_self_attn_v_proj_bias_to_fp16, weight = layers_19_self_attn_v_proj_weight_to_fp16_palettized, x = x_119_cast_fp16)[name = tensor("linear_117_cast_fp16")]; tensor concat_80x = const()[name = tensor("concat_80x"), val = tensor([1, -1, 16, 64])]; tensor var_1522_cast_fp16 = reshape(shape = concat_80x, x = linear_117_cast_fp16)[name = tensor("op_1522_cast_fp16")]; tensor v_39_perm_0 = const()[name = tensor("v_39_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1525_transpose_x_0 = const()[name = tensor("op_1525_transpose_x_0"), val = tensor(false)]; tensor var_1525_transpose_y_0 = const()[name = tensor("op_1525_transpose_y_0"), val = tensor(false)]; tensor transpose_134_perm_0 = const()[name = tensor("transpose_134_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_135_perm_0 = const()[name = tensor("transpose_135_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_135 = transpose(perm = transpose_135_perm_0, x = var_1516_cast_fp16)[name = tensor("transpose_162")]; tensor transpose_134 = transpose(perm = transpose_134_perm_0, x = var_1510_cast_fp16)[name = tensor("transpose_163")]; tensor var_1525_cast_fp16 = matmul(transpose_x = var_1525_transpose_x_0, transpose_y = var_1525_transpose_y_0, x = transpose_134, y = transpose_135)[name = tensor("op_1525_cast_fp16")]; tensor var_1526_to_fp16 = const()[name = tensor("op_1526_to_fp16"), val = tensor(0x1p-3)]; tensor input_239_cast_fp16 = mul(x = var_1525_cast_fp16, y = var_1526_to_fp16)[name = tensor("input_239_cast_fp16")]; tensor attn_39_cast_fp16 = softmax(axis = var_1486, x = input_239_cast_fp16)[name = tensor("attn_39_cast_fp16")]; tensor out_39_transpose_x_0 = const()[name = tensor("out_39_transpose_x_0"), val = tensor(false)]; tensor out_39_transpose_y_0 = const()[name = tensor("out_39_transpose_y_0"), val = tensor(false)]; tensor v_39_cast_fp16 = transpose(perm = v_39_perm_0, x = var_1522_cast_fp16)[name = tensor("transpose_161")]; tensor out_39_cast_fp16 = matmul(transpose_x = out_39_transpose_x_0, transpose_y = out_39_transpose_y_0, x = attn_39_cast_fp16, y = v_39_cast_fp16)[name = tensor("out_39_cast_fp16")]; tensor var_1530_perm_0 = const()[name = tensor("op_1530_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_81x = const()[name = tensor("concat_81x"), val = tensor([1, -1, 1024])]; tensor var_1530_cast_fp16 = transpose(perm = var_1530_perm_0, x = out_39_cast_fp16)[name = tensor("transpose_160")]; tensor input_241_cast_fp16 = reshape(shape = concat_81x, x = var_1530_cast_fp16)[name = tensor("input_241_cast_fp16")]; tensor layers_19_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(256384832))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(257433472))), name = tensor("layers_19_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_19_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_19_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(257434048)))]; tensor linear_118_cast_fp16 = linear(bias = layers_19_self_attn_out_proj_bias_to_fp16, weight = layers_19_self_attn_out_proj_weight_to_fp16_palettized, x = input_241_cast_fp16)[name = tensor("linear_118_cast_fp16")]; tensor input_243_cast_fp16 = add(x = input_237_cast_fp16, y = linear_118_cast_fp16)[name = tensor("input_243_cast_fp16")]; tensor input_245_axes_0 = const()[name = tensor("input_245_axes_0"), val = tensor([-1])]; tensor layers_19_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_19_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(257436160)))]; tensor layers_19_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_19_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(257438272)))]; tensor input_245_cast_fp16 = layer_norm(axes = input_245_axes_0, beta = layers_19_final_layer_norm_bias_to_fp16, epsilon = var_1489_to_fp16, gamma = layers_19_final_layer_norm_weight_to_fp16, x = input_243_cast_fp16)[name = tensor("input_245_cast_fp16")]; tensor layers_19_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(257440384))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(261634752))), name = tensor("layers_19_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_19_fc1_bias_to_fp16 = const()[name = tensor("layers_19_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(261635328)))]; tensor linear_119_cast_fp16 = linear(bias = layers_19_fc1_bias_to_fp16, weight = layers_19_fc1_weight_to_fp16_palettized, x = input_245_cast_fp16)[name = tensor("linear_119_cast_fp16")]; tensor input_247_mode_0 = const()[name = tensor("input_247_mode_0"), val = tensor("EXACT")]; tensor input_247_cast_fp16 = gelu(mode = input_247_mode_0, x = linear_119_cast_fp16)[name = tensor("input_247_cast_fp16")]; tensor layers_19_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(261643584))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265837952))), name = tensor("layers_19_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_19_fc2_bias_to_fp16 = const()[name = tensor("layers_19_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265838528)))]; tensor linear_120_cast_fp16 = linear(bias = layers_19_fc2_bias_to_fp16, weight = layers_19_fc2_weight_to_fp16_palettized, x = input_247_cast_fp16)[name = tensor("linear_120_cast_fp16")]; tensor input_249_cast_fp16 = add(x = input_243_cast_fp16, y = linear_120_cast_fp16)[name = tensor("input_249_cast_fp16")]; tensor var_1556 = const()[name = tensor("op_1556"), val = tensor(-1)]; tensor x_125_axes_0 = const()[name = tensor("x_125_axes_0"), val = tensor([-1])]; tensor layers_20_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_20_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265840640)))]; tensor layers_20_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_20_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265842752)))]; tensor var_1559_to_fp16 = const()[name = tensor("op_1559_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_125_cast_fp16 = layer_norm(axes = x_125_axes_0, beta = layers_20_self_attn_layer_norm_bias_to_fp16, epsilon = var_1559_to_fp16, gamma = layers_20_self_attn_layer_norm_weight_to_fp16, x = input_249_cast_fp16)[name = tensor("x_125_cast_fp16")]; tensor layers_20_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265844864))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(266893504))), name = tensor("layers_20_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_20_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_20_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(266894080)))]; tensor linear_121_cast_fp16 = linear(bias = layers_20_self_attn_q_proj_bias_to_fp16, weight = layers_20_self_attn_q_proj_weight_to_fp16_palettized, x = x_125_cast_fp16)[name = tensor("linear_121_cast_fp16")]; tensor concat_82x = const()[name = tensor("concat_82x"), val = tensor([1, -1, 16, 64])]; tensor var_1580_cast_fp16 = reshape(shape = concat_82x, x = linear_121_cast_fp16)[name = tensor("op_1580_cast_fp16")]; tensor layers_20_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(266896192))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(267944832))), name = tensor("layers_20_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_20_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_20_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(267945408)))]; tensor linear_122_cast_fp16 = linear(bias = layers_20_self_attn_k_proj_bias_to_fp16, weight = layers_20_self_attn_k_proj_weight_to_fp16_palettized, x = x_125_cast_fp16)[name = tensor("linear_122_cast_fp16")]; tensor concat_83x = const()[name = tensor("concat_83x"), val = tensor([1, -1, 16, 64])]; tensor var_1586_cast_fp16 = reshape(shape = concat_83x, x = linear_122_cast_fp16)[name = tensor("op_1586_cast_fp16")]; tensor layers_20_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(267947520))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(268996160))), name = tensor("layers_20_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_20_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_20_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(268996736)))]; tensor linear_123_cast_fp16 = linear(bias = layers_20_self_attn_v_proj_bias_to_fp16, weight = layers_20_self_attn_v_proj_weight_to_fp16_palettized, x = x_125_cast_fp16)[name = tensor("linear_123_cast_fp16")]; tensor concat_84x = const()[name = tensor("concat_84x"), val = tensor([1, -1, 16, 64])]; tensor var_1592_cast_fp16 = reshape(shape = concat_84x, x = linear_123_cast_fp16)[name = tensor("op_1592_cast_fp16")]; tensor v_41_perm_0 = const()[name = tensor("v_41_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1595_transpose_x_0 = const()[name = tensor("op_1595_transpose_x_0"), val = tensor(false)]; tensor var_1595_transpose_y_0 = const()[name = tensor("op_1595_transpose_y_0"), val = tensor(false)]; tensor transpose_136_perm_0 = const()[name = tensor("transpose_136_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_137_perm_0 = const()[name = tensor("transpose_137_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_137 = transpose(perm = transpose_137_perm_0, x = var_1586_cast_fp16)[name = tensor("transpose_158")]; tensor transpose_136 = transpose(perm = transpose_136_perm_0, x = var_1580_cast_fp16)[name = tensor("transpose_159")]; tensor var_1595_cast_fp16 = matmul(transpose_x = var_1595_transpose_x_0, transpose_y = var_1595_transpose_y_0, x = transpose_136, y = transpose_137)[name = tensor("op_1595_cast_fp16")]; tensor var_1596_to_fp16 = const()[name = tensor("op_1596_to_fp16"), val = tensor(0x1p-3)]; tensor input_251_cast_fp16 = mul(x = var_1595_cast_fp16, y = var_1596_to_fp16)[name = tensor("input_251_cast_fp16")]; tensor attn_41_cast_fp16 = softmax(axis = var_1556, x = input_251_cast_fp16)[name = tensor("attn_41_cast_fp16")]; tensor out_41_transpose_x_0 = const()[name = tensor("out_41_transpose_x_0"), val = tensor(false)]; tensor out_41_transpose_y_0 = const()[name = tensor("out_41_transpose_y_0"), val = tensor(false)]; tensor v_41_cast_fp16 = transpose(perm = v_41_perm_0, x = var_1592_cast_fp16)[name = tensor("transpose_157")]; tensor out_41_cast_fp16 = matmul(transpose_x = out_41_transpose_x_0, transpose_y = out_41_transpose_y_0, x = attn_41_cast_fp16, y = v_41_cast_fp16)[name = tensor("out_41_cast_fp16")]; tensor var_1600_perm_0 = const()[name = tensor("op_1600_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_85x = const()[name = tensor("concat_85x"), val = tensor([1, -1, 1024])]; tensor var_1600_cast_fp16 = transpose(perm = var_1600_perm_0, x = out_41_cast_fp16)[name = tensor("transpose_156")]; tensor input_253_cast_fp16 = reshape(shape = concat_85x, x = var_1600_cast_fp16)[name = tensor("input_253_cast_fp16")]; tensor layers_20_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(268998848))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270047488))), name = tensor("layers_20_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_20_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_20_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270048064)))]; tensor linear_124_cast_fp16 = linear(bias = layers_20_self_attn_out_proj_bias_to_fp16, weight = layers_20_self_attn_out_proj_weight_to_fp16_palettized, x = input_253_cast_fp16)[name = tensor("linear_124_cast_fp16")]; tensor input_255_cast_fp16 = add(x = input_249_cast_fp16, y = linear_124_cast_fp16)[name = tensor("input_255_cast_fp16")]; tensor input_257_axes_0 = const()[name = tensor("input_257_axes_0"), val = tensor([-1])]; tensor layers_20_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_20_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270050176)))]; tensor layers_20_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_20_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270052288)))]; tensor input_257_cast_fp16 = layer_norm(axes = input_257_axes_0, beta = layers_20_final_layer_norm_bias_to_fp16, epsilon = var_1559_to_fp16, gamma = layers_20_final_layer_norm_weight_to_fp16, x = input_255_cast_fp16)[name = tensor("input_257_cast_fp16")]; tensor layers_20_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270054400))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(274248768))), name = tensor("layers_20_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_20_fc1_bias_to_fp16 = const()[name = tensor("layers_20_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(274249344)))]; tensor linear_125_cast_fp16 = linear(bias = layers_20_fc1_bias_to_fp16, weight = layers_20_fc1_weight_to_fp16_palettized, x = input_257_cast_fp16)[name = tensor("linear_125_cast_fp16")]; tensor input_259_mode_0 = const()[name = tensor("input_259_mode_0"), val = tensor("EXACT")]; tensor input_259_cast_fp16 = gelu(mode = input_259_mode_0, x = linear_125_cast_fp16)[name = tensor("input_259_cast_fp16")]; tensor layers_20_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(274257600))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278451968))), name = tensor("layers_20_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_20_fc2_bias_to_fp16 = const()[name = tensor("layers_20_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278452544)))]; tensor linear_126_cast_fp16 = linear(bias = layers_20_fc2_bias_to_fp16, weight = layers_20_fc2_weight_to_fp16_palettized, x = input_259_cast_fp16)[name = tensor("linear_126_cast_fp16")]; tensor input_261_cast_fp16 = add(x = input_255_cast_fp16, y = linear_126_cast_fp16)[name = tensor("input_261_cast_fp16")]; tensor var_1626 = const()[name = tensor("op_1626"), val = tensor(-1)]; tensor x_131_axes_0 = const()[name = tensor("x_131_axes_0"), val = tensor([-1])]; tensor layers_21_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_21_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278454656)))]; tensor layers_21_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_21_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278456768)))]; tensor var_1629_to_fp16 = const()[name = tensor("op_1629_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_131_cast_fp16 = layer_norm(axes = x_131_axes_0, beta = layers_21_self_attn_layer_norm_bias_to_fp16, epsilon = var_1629_to_fp16, gamma = layers_21_self_attn_layer_norm_weight_to_fp16, x = input_261_cast_fp16)[name = tensor("x_131_cast_fp16")]; tensor layers_21_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278458880))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(279507520))), name = tensor("layers_21_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_21_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_21_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(279508096)))]; tensor linear_127_cast_fp16 = linear(bias = layers_21_self_attn_q_proj_bias_to_fp16, weight = layers_21_self_attn_q_proj_weight_to_fp16_palettized, x = x_131_cast_fp16)[name = tensor("linear_127_cast_fp16")]; tensor concat_86x = const()[name = tensor("concat_86x"), val = tensor([1, -1, 16, 64])]; tensor var_1650_cast_fp16 = reshape(shape = concat_86x, x = linear_127_cast_fp16)[name = tensor("op_1650_cast_fp16")]; tensor layers_21_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(279510208))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(280558848))), name = tensor("layers_21_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_21_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_21_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(280559424)))]; tensor linear_128_cast_fp16 = linear(bias = layers_21_self_attn_k_proj_bias_to_fp16, weight = layers_21_self_attn_k_proj_weight_to_fp16_palettized, x = x_131_cast_fp16)[name = tensor("linear_128_cast_fp16")]; tensor concat_87x = const()[name = tensor("concat_87x"), val = tensor([1, -1, 16, 64])]; tensor var_1656_cast_fp16 = reshape(shape = concat_87x, x = linear_128_cast_fp16)[name = tensor("op_1656_cast_fp16")]; tensor layers_21_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(280561536))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(281610176))), name = tensor("layers_21_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_21_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_21_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(281610752)))]; tensor linear_129_cast_fp16 = linear(bias = layers_21_self_attn_v_proj_bias_to_fp16, weight = layers_21_self_attn_v_proj_weight_to_fp16_palettized, x = x_131_cast_fp16)[name = tensor("linear_129_cast_fp16")]; tensor concat_88x = const()[name = tensor("concat_88x"), val = tensor([1, -1, 16, 64])]; tensor var_1662_cast_fp16 = reshape(shape = concat_88x, x = linear_129_cast_fp16)[name = tensor("op_1662_cast_fp16")]; tensor v_43_perm_0 = const()[name = tensor("v_43_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1665_transpose_x_0 = const()[name = tensor("op_1665_transpose_x_0"), val = tensor(false)]; tensor var_1665_transpose_y_0 = const()[name = tensor("op_1665_transpose_y_0"), val = tensor(false)]; tensor transpose_138_perm_0 = const()[name = tensor("transpose_138_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_139_perm_0 = const()[name = tensor("transpose_139_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_139 = transpose(perm = transpose_139_perm_0, x = var_1656_cast_fp16)[name = tensor("transpose_154")]; tensor transpose_138 = transpose(perm = transpose_138_perm_0, x = var_1650_cast_fp16)[name = tensor("transpose_155")]; tensor var_1665_cast_fp16 = matmul(transpose_x = var_1665_transpose_x_0, transpose_y = var_1665_transpose_y_0, x = transpose_138, y = transpose_139)[name = tensor("op_1665_cast_fp16")]; tensor var_1666_to_fp16 = const()[name = tensor("op_1666_to_fp16"), val = tensor(0x1p-3)]; tensor input_263_cast_fp16 = mul(x = var_1665_cast_fp16, y = var_1666_to_fp16)[name = tensor("input_263_cast_fp16")]; tensor attn_43_cast_fp16 = softmax(axis = var_1626, x = input_263_cast_fp16)[name = tensor("attn_43_cast_fp16")]; tensor out_43_transpose_x_0 = const()[name = tensor("out_43_transpose_x_0"), val = tensor(false)]; tensor out_43_transpose_y_0 = const()[name = tensor("out_43_transpose_y_0"), val = tensor(false)]; tensor v_43_cast_fp16 = transpose(perm = v_43_perm_0, x = var_1662_cast_fp16)[name = tensor("transpose_153")]; tensor out_43_cast_fp16 = matmul(transpose_x = out_43_transpose_x_0, transpose_y = out_43_transpose_y_0, x = attn_43_cast_fp16, y = v_43_cast_fp16)[name = tensor("out_43_cast_fp16")]; tensor var_1670_perm_0 = const()[name = tensor("op_1670_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_89x = const()[name = tensor("concat_89x"), val = tensor([1, -1, 1024])]; tensor var_1670_cast_fp16 = transpose(perm = var_1670_perm_0, x = out_43_cast_fp16)[name = tensor("transpose_152")]; tensor input_265_cast_fp16 = reshape(shape = concat_89x, x = var_1670_cast_fp16)[name = tensor("input_265_cast_fp16")]; tensor layers_21_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(281612864))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(282661504))), name = tensor("layers_21_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_21_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_21_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(282662080)))]; tensor linear_130_cast_fp16 = linear(bias = layers_21_self_attn_out_proj_bias_to_fp16, weight = layers_21_self_attn_out_proj_weight_to_fp16_palettized, x = input_265_cast_fp16)[name = tensor("linear_130_cast_fp16")]; tensor input_267_cast_fp16 = add(x = input_261_cast_fp16, y = linear_130_cast_fp16)[name = tensor("input_267_cast_fp16")]; tensor input_269_axes_0 = const()[name = tensor("input_269_axes_0"), val = tensor([-1])]; tensor layers_21_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_21_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(282664192)))]; tensor layers_21_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_21_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(282666304)))]; tensor input_269_cast_fp16 = layer_norm(axes = input_269_axes_0, beta = layers_21_final_layer_norm_bias_to_fp16, epsilon = var_1629_to_fp16, gamma = layers_21_final_layer_norm_weight_to_fp16, x = input_267_cast_fp16)[name = tensor("input_269_cast_fp16")]; tensor layers_21_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(282668416))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286862784))), name = tensor("layers_21_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_21_fc1_bias_to_fp16 = const()[name = tensor("layers_21_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286863360)))]; tensor linear_131_cast_fp16 = linear(bias = layers_21_fc1_bias_to_fp16, weight = layers_21_fc1_weight_to_fp16_palettized, x = input_269_cast_fp16)[name = tensor("linear_131_cast_fp16")]; tensor input_271_mode_0 = const()[name = tensor("input_271_mode_0"), val = tensor("EXACT")]; tensor input_271_cast_fp16 = gelu(mode = input_271_mode_0, x = linear_131_cast_fp16)[name = tensor("input_271_cast_fp16")]; tensor layers_21_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286871616))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291065984))), name = tensor("layers_21_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_21_fc2_bias_to_fp16 = const()[name = tensor("layers_21_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291066560)))]; tensor linear_132_cast_fp16 = linear(bias = layers_21_fc2_bias_to_fp16, weight = layers_21_fc2_weight_to_fp16_palettized, x = input_271_cast_fp16)[name = tensor("linear_132_cast_fp16")]; tensor input_273_cast_fp16 = add(x = input_267_cast_fp16, y = linear_132_cast_fp16)[name = tensor("input_273_cast_fp16")]; tensor var_1696 = const()[name = tensor("op_1696"), val = tensor(-1)]; tensor x_137_axes_0 = const()[name = tensor("x_137_axes_0"), val = tensor([-1])]; tensor layers_22_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_22_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291068672)))]; tensor layers_22_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_22_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291070784)))]; tensor var_1699_to_fp16 = const()[name = tensor("op_1699_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_137_cast_fp16 = layer_norm(axes = x_137_axes_0, beta = layers_22_self_attn_layer_norm_bias_to_fp16, epsilon = var_1699_to_fp16, gamma = layers_22_self_attn_layer_norm_weight_to_fp16, x = input_273_cast_fp16)[name = tensor("x_137_cast_fp16")]; tensor layers_22_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291072896))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(292121536))), name = tensor("layers_22_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_22_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_22_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(292122112)))]; tensor linear_133_cast_fp16 = linear(bias = layers_22_self_attn_q_proj_bias_to_fp16, weight = layers_22_self_attn_q_proj_weight_to_fp16_palettized, x = x_137_cast_fp16)[name = tensor("linear_133_cast_fp16")]; tensor concat_90x = const()[name = tensor("concat_90x"), val = tensor([1, -1, 16, 64])]; tensor var_1720_cast_fp16 = reshape(shape = concat_90x, x = linear_133_cast_fp16)[name = tensor("op_1720_cast_fp16")]; tensor layers_22_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(292124224))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293172864))), name = tensor("layers_22_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_22_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_22_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293173440)))]; tensor linear_134_cast_fp16 = linear(bias = layers_22_self_attn_k_proj_bias_to_fp16, weight = layers_22_self_attn_k_proj_weight_to_fp16_palettized, x = x_137_cast_fp16)[name = tensor("linear_134_cast_fp16")]; tensor concat_91x = const()[name = tensor("concat_91x"), val = tensor([1, -1, 16, 64])]; tensor var_1726_cast_fp16 = reshape(shape = concat_91x, x = linear_134_cast_fp16)[name = tensor("op_1726_cast_fp16")]; tensor layers_22_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293175552))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(294224192))), name = tensor("layers_22_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_22_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_22_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(294224768)))]; tensor linear_135_cast_fp16 = linear(bias = layers_22_self_attn_v_proj_bias_to_fp16, weight = layers_22_self_attn_v_proj_weight_to_fp16_palettized, x = x_137_cast_fp16)[name = tensor("linear_135_cast_fp16")]; tensor concat_92x = const()[name = tensor("concat_92x"), val = tensor([1, -1, 16, 64])]; tensor var_1732_cast_fp16 = reshape(shape = concat_92x, x = linear_135_cast_fp16)[name = tensor("op_1732_cast_fp16")]; tensor v_45_perm_0 = const()[name = tensor("v_45_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1735_transpose_x_0 = const()[name = tensor("op_1735_transpose_x_0"), val = tensor(false)]; tensor var_1735_transpose_y_0 = const()[name = tensor("op_1735_transpose_y_0"), val = tensor(false)]; tensor transpose_140_perm_0 = const()[name = tensor("transpose_140_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_141_perm_0 = const()[name = tensor("transpose_141_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_141 = transpose(perm = transpose_141_perm_0, x = var_1726_cast_fp16)[name = tensor("transpose_150")]; tensor transpose_140 = transpose(perm = transpose_140_perm_0, x = var_1720_cast_fp16)[name = tensor("transpose_151")]; tensor var_1735_cast_fp16 = matmul(transpose_x = var_1735_transpose_x_0, transpose_y = var_1735_transpose_y_0, x = transpose_140, y = transpose_141)[name = tensor("op_1735_cast_fp16")]; tensor var_1736_to_fp16 = const()[name = tensor("op_1736_to_fp16"), val = tensor(0x1p-3)]; tensor input_275_cast_fp16 = mul(x = var_1735_cast_fp16, y = var_1736_to_fp16)[name = tensor("input_275_cast_fp16")]; tensor attn_45_cast_fp16 = softmax(axis = var_1696, x = input_275_cast_fp16)[name = tensor("attn_45_cast_fp16")]; tensor out_45_transpose_x_0 = const()[name = tensor("out_45_transpose_x_0"), val = tensor(false)]; tensor out_45_transpose_y_0 = const()[name = tensor("out_45_transpose_y_0"), val = tensor(false)]; tensor v_45_cast_fp16 = transpose(perm = v_45_perm_0, x = var_1732_cast_fp16)[name = tensor("transpose_149")]; tensor out_45_cast_fp16 = matmul(transpose_x = out_45_transpose_x_0, transpose_y = out_45_transpose_y_0, x = attn_45_cast_fp16, y = v_45_cast_fp16)[name = tensor("out_45_cast_fp16")]; tensor var_1740_perm_0 = const()[name = tensor("op_1740_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_93x = const()[name = tensor("concat_93x"), val = tensor([1, -1, 1024])]; tensor var_1740_cast_fp16 = transpose(perm = var_1740_perm_0, x = out_45_cast_fp16)[name = tensor("transpose_148")]; tensor input_277_cast_fp16 = reshape(shape = concat_93x, x = var_1740_cast_fp16)[name = tensor("input_277_cast_fp16")]; tensor layers_22_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(294226880))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295275520))), name = tensor("layers_22_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_22_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_22_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295276096)))]; tensor linear_136_cast_fp16 = linear(bias = layers_22_self_attn_out_proj_bias_to_fp16, weight = layers_22_self_attn_out_proj_weight_to_fp16_palettized, x = input_277_cast_fp16)[name = tensor("linear_136_cast_fp16")]; tensor input_279_cast_fp16 = add(x = input_273_cast_fp16, y = linear_136_cast_fp16)[name = tensor("input_279_cast_fp16")]; tensor input_281_axes_0 = const()[name = tensor("input_281_axes_0"), val = tensor([-1])]; tensor layers_22_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_22_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295278208)))]; tensor layers_22_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_22_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295280320)))]; tensor input_281_cast_fp16 = layer_norm(axes = input_281_axes_0, beta = layers_22_final_layer_norm_bias_to_fp16, epsilon = var_1699_to_fp16, gamma = layers_22_final_layer_norm_weight_to_fp16, x = input_279_cast_fp16)[name = tensor("input_281_cast_fp16")]; tensor layers_22_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295282432))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299476800))), name = tensor("layers_22_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_22_fc1_bias_to_fp16 = const()[name = tensor("layers_22_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299477376)))]; tensor linear_137_cast_fp16 = linear(bias = layers_22_fc1_bias_to_fp16, weight = layers_22_fc1_weight_to_fp16_palettized, x = input_281_cast_fp16)[name = tensor("linear_137_cast_fp16")]; tensor input_283_mode_0 = const()[name = tensor("input_283_mode_0"), val = tensor("EXACT")]; tensor input_283_cast_fp16 = gelu(mode = input_283_mode_0, x = linear_137_cast_fp16)[name = tensor("input_283_cast_fp16")]; tensor layers_22_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299485632))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303680000))), name = tensor("layers_22_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_22_fc2_bias_to_fp16 = const()[name = tensor("layers_22_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303680576)))]; tensor linear_138_cast_fp16 = linear(bias = layers_22_fc2_bias_to_fp16, weight = layers_22_fc2_weight_to_fp16_palettized, x = input_283_cast_fp16)[name = tensor("linear_138_cast_fp16")]; tensor input_285_cast_fp16 = add(x = input_279_cast_fp16, y = linear_138_cast_fp16)[name = tensor("input_285_cast_fp16")]; tensor var_1766 = const()[name = tensor("op_1766"), val = tensor(-1)]; tensor x_143_axes_0 = const()[name = tensor("x_143_axes_0"), val = tensor([-1])]; tensor layers_23_self_attn_layer_norm_weight_to_fp16 = const()[name = tensor("layers_23_self_attn_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303682688)))]; tensor layers_23_self_attn_layer_norm_bias_to_fp16 = const()[name = tensor("layers_23_self_attn_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303684800)))]; tensor var_1769_to_fp16 = const()[name = tensor("op_1769_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_143_cast_fp16 = layer_norm(axes = x_143_axes_0, beta = layers_23_self_attn_layer_norm_bias_to_fp16, epsilon = var_1769_to_fp16, gamma = layers_23_self_attn_layer_norm_weight_to_fp16, x = input_285_cast_fp16)[name = tensor("x_143_cast_fp16")]; tensor layers_23_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303686912))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(304735552))), name = tensor("layers_23_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_23_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_23_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(304736128)))]; tensor linear_139_cast_fp16 = linear(bias = layers_23_self_attn_q_proj_bias_to_fp16, weight = layers_23_self_attn_q_proj_weight_to_fp16_palettized, x = x_143_cast_fp16)[name = tensor("linear_139_cast_fp16")]; tensor concat_94x = const()[name = tensor("concat_94x"), val = tensor([1, -1, 16, 64])]; tensor var_1790_cast_fp16 = reshape(shape = concat_94x, x = linear_139_cast_fp16)[name = tensor("op_1790_cast_fp16")]; tensor layers_23_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(304738240))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(305786880))), name = tensor("layers_23_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_23_self_attn_k_proj_bias_to_fp16 = const()[name = tensor("layers_23_self_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(305787456)))]; tensor linear_140_cast_fp16 = linear(bias = layers_23_self_attn_k_proj_bias_to_fp16, weight = layers_23_self_attn_k_proj_weight_to_fp16_palettized, x = x_143_cast_fp16)[name = tensor("linear_140_cast_fp16")]; tensor concat_95x = const()[name = tensor("concat_95x"), val = tensor([1, -1, 16, 64])]; tensor var_1796_cast_fp16 = reshape(shape = concat_95x, x = linear_140_cast_fp16)[name = tensor("op_1796_cast_fp16")]; tensor layers_23_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(305789568))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(306838208))), name = tensor("layers_23_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_23_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_23_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(306838784)))]; tensor linear_141_cast_fp16 = linear(bias = layers_23_self_attn_v_proj_bias_to_fp16, weight = layers_23_self_attn_v_proj_weight_to_fp16_palettized, x = x_143_cast_fp16)[name = tensor("linear_141_cast_fp16")]; tensor concat_96x = const()[name = tensor("concat_96x"), val = tensor([1, -1, 16, 64])]; tensor var_1802_cast_fp16 = reshape(shape = concat_96x, x = linear_141_cast_fp16)[name = tensor("op_1802_cast_fp16")]; tensor v_perm_0 = const()[name = tensor("v_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1805_transpose_x_0 = const()[name = tensor("op_1805_transpose_x_0"), val = tensor(false)]; tensor var_1805_transpose_y_0 = const()[name = tensor("op_1805_transpose_y_0"), val = tensor(false)]; tensor transpose_142_perm_0 = const()[name = tensor("transpose_142_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_143_perm_0 = const()[name = tensor("transpose_143_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_143 = transpose(perm = transpose_143_perm_0, x = var_1796_cast_fp16)[name = tensor("transpose_146")]; tensor transpose_142 = transpose(perm = transpose_142_perm_0, x = var_1790_cast_fp16)[name = tensor("transpose_147")]; tensor var_1805_cast_fp16 = matmul(transpose_x = var_1805_transpose_x_0, transpose_y = var_1805_transpose_y_0, x = transpose_142, y = transpose_143)[name = tensor("op_1805_cast_fp16")]; tensor var_1806_to_fp16 = const()[name = tensor("op_1806_to_fp16"), val = tensor(0x1p-3)]; tensor input_287_cast_fp16 = mul(x = var_1805_cast_fp16, y = var_1806_to_fp16)[name = tensor("input_287_cast_fp16")]; tensor attn_cast_fp16 = softmax(axis = var_1766, x = input_287_cast_fp16)[name = tensor("attn_cast_fp16")]; tensor out_transpose_x_0 = const()[name = tensor("out_transpose_x_0"), val = tensor(false)]; tensor out_transpose_y_0 = const()[name = tensor("out_transpose_y_0"), val = tensor(false)]; tensor v_cast_fp16 = transpose(perm = v_perm_0, x = var_1802_cast_fp16)[name = tensor("transpose_145")]; tensor out_cast_fp16 = matmul(transpose_x = out_transpose_x_0, transpose_y = out_transpose_y_0, x = attn_cast_fp16, y = v_cast_fp16)[name = tensor("out_cast_fp16")]; tensor var_1810_perm_0 = const()[name = tensor("op_1810_perm_0"), val = tensor([0, 2, 1, 3])]; tensor concat_97x = const()[name = tensor("concat_97x"), val = tensor([1, -1, 1024])]; tensor var_1810_cast_fp16 = transpose(perm = var_1810_perm_0, x = out_cast_fp16)[name = tensor("transpose_144")]; tensor input_289_cast_fp16 = reshape(shape = concat_97x, x = var_1810_cast_fp16)[name = tensor("input_289_cast_fp16")]; tensor layers_23_self_attn_out_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(306840896))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(307889536))), name = tensor("layers_23_self_attn_out_proj_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor layers_23_self_attn_out_proj_bias_to_fp16 = const()[name = tensor("layers_23_self_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(307890112)))]; tensor linear_142_cast_fp16 = linear(bias = layers_23_self_attn_out_proj_bias_to_fp16, weight = layers_23_self_attn_out_proj_weight_to_fp16_palettized, x = input_289_cast_fp16)[name = tensor("linear_142_cast_fp16")]; tensor input_291_cast_fp16 = add(x = input_285_cast_fp16, y = linear_142_cast_fp16)[name = tensor("input_291_cast_fp16")]; tensor input_293_axes_0 = const()[name = tensor("input_293_axes_0"), val = tensor([-1])]; tensor layers_23_final_layer_norm_weight_to_fp16 = const()[name = tensor("layers_23_final_layer_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(307892224)))]; tensor layers_23_final_layer_norm_bias_to_fp16 = const()[name = tensor("layers_23_final_layer_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(307894336)))]; tensor input_293_cast_fp16 = layer_norm(axes = input_293_axes_0, beta = layers_23_final_layer_norm_bias_to_fp16, epsilon = var_1769_to_fp16, gamma = layers_23_final_layer_norm_weight_to_fp16, x = input_291_cast_fp16)[name = tensor("input_293_cast_fp16")]; tensor layers_23_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(307896448))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312090816))), name = tensor("layers_23_fc1_weight_to_fp16_palettized"), shape = tensor([4096, 1024])]; tensor layers_23_fc1_bias_to_fp16 = const()[name = tensor("layers_23_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312091392)))]; tensor linear_143_cast_fp16 = linear(bias = layers_23_fc1_bias_to_fp16, weight = layers_23_fc1_weight_to_fp16_palettized, x = input_293_cast_fp16)[name = tensor("linear_143_cast_fp16")]; tensor input_295_mode_0 = const()[name = tensor("input_295_mode_0"), val = tensor("EXACT")]; tensor input_295_cast_fp16 = gelu(mode = input_295_mode_0, x = linear_143_cast_fp16)[name = tensor("input_295_cast_fp16")]; tensor layers_23_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312099648))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316294016))), name = tensor("layers_23_fc2_weight_to_fp16_palettized"), shape = tensor([1024, 4096])]; tensor layers_23_fc2_bias_to_fp16 = const()[name = tensor("layers_23_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316294592)))]; tensor linear_144_cast_fp16 = linear(bias = layers_23_fc2_bias_to_fp16, weight = layers_23_fc2_weight_to_fp16_palettized, x = input_295_cast_fp16)[name = tensor("linear_144_cast_fp16")]; tensor input_297_cast_fp16 = add(x = input_291_cast_fp16, y = linear_144_cast_fp16)[name = tensor("input_297_cast_fp16")]; tensor input_299_axes_0 = const()[name = tensor("input_299_axes_0"), val = tensor([-1])]; tensor ln_post_weight_to_fp16 = const()[name = tensor("ln_post_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316296704)))]; tensor ln_post_bias_to_fp16 = const()[name = tensor("ln_post_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316298816)))]; tensor var_1830_to_fp16 = const()[name = tensor("op_1830_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_299_cast_fp16 = layer_norm(axes = input_299_axes_0, beta = ln_post_bias_to_fp16, epsilon = var_1830_to_fp16, gamma = ln_post_weight_to_fp16, x = input_297_cast_fp16)[name = tensor("input_299_cast_fp16")]; tensor proj1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316300928))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(317349568))), name = tensor("proj1_weight_to_fp16_palettized"), shape = tensor([1024, 1024])]; tensor proj1_bias_to_fp16 = const()[name = tensor("proj1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(317350144)))]; tensor linear_145_cast_fp16 = linear(bias = proj1_bias_to_fp16, weight = proj1_weight_to_fp16_palettized, x = input_299_cast_fp16)[name = tensor("linear_145_cast_fp16")]; tensor input_mode_0 = const()[name = tensor("input_mode_0"), val = tensor("EXACT")]; tensor input_cast_fp16 = gelu(mode = input_mode_0, x = linear_145_cast_fp16)[name = tensor("input_cast_fp16")]; tensor proj2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(317352256))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(319449472))), name = tensor("proj2_weight_to_fp16_palettized"), shape = tensor([2048, 1024])]; tensor proj2_bias_to_fp16 = const()[name = tensor("proj2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(319450048)))]; tensor audio_embeddings = linear(bias = proj2_bias_to_fp16, weight = proj2_weight_to_fp16_palettized, x = input_cast_fp16)[name = tensor("linear_146_cast_fp16")]; } -> (audio_embeddings); }