program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3520.4.1"}, {"coremlc-version", "3520.5.1"}})] { func main(tensor ac, tensor elen, tensor enc, tensor tn) { tensor var_20 = const()[name = tensor("op_20"), val = tensor(-1)]; tensor const_1 = const()[name = tensor("const_1"), val = tensor([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127])]; tensor matrix_1_axes_0 = const()[name = tensor("matrix_1_axes_0"), val = tensor([-1])]; tensor matrix_1 = expand_dims(axes = matrix_1_axes_0, x = tn)[name = tensor("matrix_1")]; tensor mask_1 = less(x = const_1, y = matrix_1)[name = tensor("mask_1")]; tensor mask_9_axes_0 = const()[name = tensor("mask_9_axes_0"), val = tensor([2])]; tensor cast_0_to_fp16_dtype_0 = const()[name = tensor("cast_0_to_fp16_dtype_0"), val = tensor("fp16")]; tensor mask_1_to_fp16 = cast(dtype = cast_0_to_fp16_dtype_0, x = mask_1)[name = tensor("cast_3")]; tensor mask_9_cast_fp16 = expand_dims(axes = mask_9_axes_0, x = mask_1_to_fp16)[name = tensor("mask_9_cast_fp16")]; tensor const_3 = const()[name = tensor("const_3"), val = tensor([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300, 301, 302, 303, 304, 305, 306, 307, 308, 309, 310, 311, 312, 313, 314, 315, 316, 317, 318, 319, 320, 321, 322, 323, 324, 325, 326, 327, 328, 329, 330, 331, 332, 333, 334, 335, 336, 337, 338, 339, 340, 341, 342, 343, 344, 345, 346, 347, 348, 349, 350, 351, 352, 353, 354, 355, 356, 357, 358, 359, 360, 361, 362, 363, 364, 365, 366, 367, 368, 369, 370, 371, 372, 373, 374, 375, 376, 377, 378, 379, 380, 381, 382, 383, 384, 385, 386, 387, 388, 389, 390, 391, 392, 393, 394, 395, 396, 397, 398, 399, 400, 401, 402, 403, 404, 405, 406, 407, 408, 409, 410, 411, 412, 413, 414, 415, 416, 417, 418, 419, 420, 421, 422, 423, 424, 425, 426, 427, 428, 429, 430, 431, 432, 433, 434, 435, 436, 437, 438, 439, 440, 441, 442, 443, 444, 445, 446, 447, 448, 449, 450, 451, 452, 453, 454, 455, 456, 457, 458, 459, 460, 461, 462, 463, 464, 465, 466, 467, 468, 469, 470, 471, 472, 473, 474, 475, 476, 477, 478, 479, 480, 481, 482, 483, 484, 485, 486, 487, 488, 489, 490, 491, 492, 493, 494, 495, 496, 497, 498, 499, 500, 501, 502, 503, 504, 505, 506, 507, 508, 509, 510, 511])]; tensor matrix_axes_0 = const()[name = tensor("matrix_axes_0"), val = tensor([-1])]; tensor matrix = expand_dims(axes = matrix_axes_0, x = elen)[name = tensor("matrix")]; tensor mask_5 = less(x = const_3, y = matrix)[name = tensor("mask_5")]; tensor var_51_axes_0 = const()[name = tensor("op_51_axes_0"), val = tensor([1])]; tensor cast_2_to_fp16_dtype_0 = const()[name = tensor("cast_2_to_fp16_dtype_0"), val = tensor("fp16")]; tensor mask_5_to_fp16 = cast(dtype = cast_2_to_fp16_dtype_0, x = mask_5)[name = tensor("cast_2")]; tensor var_51_cast_fp16 = expand_dims(axes = var_51_axes_0, x = mask_5_to_fp16)[name = tensor("op_51_cast_fp16")]; tensor input_1_axes_0 = const()[name = tensor("input_1_axes_0"), val = tensor([-1])]; tensor ac_to_fp16_dtype_0 = const()[name = tensor("ac_to_fp16_dtype_0"), val = tensor("fp16")]; tensor d_decoders_0_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_0_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor d_decoders_0_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_0_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1152)))]; tensor var_15_to_fp16 = const()[name = tensor("op_15_to_fp16"), val = tensor(0x1p-24)]; tensor ac_to_fp16 = cast(dtype = ac_to_fp16_dtype_0, x = ac)[name = tensor("cast_1")]; tensor input_1_cast_fp16 = layer_norm(axes = input_1_axes_0, beta = d_decoders_0_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_0_norm1_weight_to_fp16, x = ac_to_fp16)[name = tensor("input_1_cast_fp16")]; tensor d_decoders_0_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_0_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2240))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1052992))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_0_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_0_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1057152)))]; tensor linear_0_cast_fp16 = linear(bias = d_decoders_0_feed_forward_w_1_bias_to_fp16, weight = d_decoders_0_feed_forward_w_1_weight_to_fp16_quantized, x = input_1_cast_fp16)[name = tensor("linear_0_cast_fp16")]; tensor input_5_cast_fp16 = relu(x = linear_0_cast_fp16)[name = tensor("input_5_cast_fp16")]; tensor input_9_axes_0 = const()[name = tensor("input_9_axes_0"), val = tensor([-1])]; tensor d_decoders_0_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_0_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1061312)))]; tensor d_decoders_0_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_0_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1065472)))]; tensor input_9_cast_fp16 = layer_norm(axes = input_9_axes_0, beta = d_decoders_0_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_0_feed_forward_norm_weight_to_fp16, x = input_5_cast_fp16)[name = tensor("input_9_cast_fp16")]; tensor d_decoders_0_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_0_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1069632))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118848))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_1_bias_0_to_fp16 = const()[name = tensor("linear_1_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2119936)))]; tensor linear_1_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_0_feed_forward_w_2_weight_to_fp16_quantized, x = input_9_cast_fp16)[name = tensor("linear_1_cast_fp16")]; tensor inputs_1_axes_0 = const()[name = tensor("inputs_1_axes_0"), val = tensor([-1])]; tensor d_decoders_0_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_0_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2121024)))]; tensor d_decoders_0_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_0_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2122112)))]; tensor inputs_1_cast_fp16 = layer_norm(axes = inputs_1_axes_0, beta = d_decoders_0_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_0_norm2_weight_to_fp16, x = linear_1_cast_fp16)[name = tensor("inputs_1_cast_fp16")]; tensor inputs_3_cast_fp16 = mul(x = inputs_1_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_3_cast_fp16")]; tensor x_1_perm_0 = const()[name = tensor("x_1_perm_0"), val = tensor([0, 2, 1])]; tensor input_13_pad_0 = const()[name = tensor("input_13_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_13_mode_0 = const()[name = tensor("input_13_mode_0"), val = tensor("constant")]; tensor const_5_to_fp16 = const()[name = tensor("const_5_to_fp16"), val = tensor(0x0p+0)]; tensor x_1_cast_fp16 = transpose(perm = x_1_perm_0, x = inputs_3_cast_fp16)[name = tensor("transpose_191")]; tensor input_13_cast_fp16 = pad(constant_val = const_5_to_fp16, mode = input_13_mode_0, pad = input_13_pad_0, x = x_1_cast_fp16)[name = tensor("input_13_cast_fp16")]; tensor x_3_pad_type_0 = const()[name = tensor("x_3_pad_type_0"), val = tensor("valid")]; tensor x_3_groups_0 = const()[name = tensor("x_3_groups_0"), val = tensor(512)]; tensor x_3_strides_0 = const()[name = tensor("x_3_strides_0"), val = tensor([1])]; tensor x_3_pad_0 = const()[name = tensor("x_3_pad_0"), val = tensor([0, 0])]; tensor x_3_dilations_0 = const()[name = tensor("x_3_dilations_0"), val = tensor([1])]; tensor d_decoders_0_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_0_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2123200))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2128896))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_3_cast_fp16 = conv(dilations = x_3_dilations_0, groups = x_3_groups_0, pad = x_3_pad_0, pad_type = x_3_pad_type_0, strides = x_3_strides_0, weight = d_decoders_0_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_13_cast_fp16)[name = tensor("x_3_cast_fp16")]; tensor x_5_perm_0 = const()[name = tensor("x_5_perm_0"), val = tensor([0, 2, 1])]; tensor x_5_cast_fp16 = transpose(perm = x_5_perm_0, x = x_3_cast_fp16)[name = tensor("transpose_190")]; tensor input_15_cast_fp16 = add(x = x_5_cast_fp16, y = inputs_3_cast_fp16)[name = tensor("input_15_cast_fp16")]; tensor input_17_cast_fp16 = mul(x = input_15_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_17_cast_fp16")]; tensor input_19_cast_fp16 = add(x = ac_to_fp16, y = input_17_cast_fp16)[name = tensor("input_19_cast_fp16")]; tensor x_11_axes_0 = const()[name = tensor("x_11_axes_0"), val = tensor([-1])]; tensor d_decoders_0_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_0_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2129984)))]; tensor d_decoders_0_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_0_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2131072)))]; tensor x_11_cast_fp16 = layer_norm(axes = x_11_axes_0, beta = d_decoders_0_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_0_norm3_weight_to_fp16, x = input_19_cast_fp16)[name = tensor("x_11_cast_fp16")]; tensor d_decoders_0_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_0_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2132160))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2394368))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_0_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_0_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2395456)))]; tensor linear_2_cast_fp16 = linear(bias = d_decoders_0_src_attn_linear_q_bias_to_fp16, weight = d_decoders_0_src_attn_linear_q_weight_to_fp16_quantized, x = x_11_cast_fp16)[name = tensor("linear_2_cast_fp16")]; tensor var_128 = const()[name = tensor("op_128"), val = tensor([1, -1, 4, 128])]; tensor var_129_cast_fp16 = reshape(shape = var_128, x = linear_2_cast_fp16)[name = tensor("op_129_cast_fp16")]; tensor enc_to_fp16_dtype_0 = const()[name = tensor("enc_to_fp16_dtype_0"), val = tensor("fp16")]; tensor d_decoders_0_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_0_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2396544))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2921984))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_0_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_0_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2924096)))]; tensor enc_to_fp16 = cast(dtype = enc_to_fp16_dtype_0, x = enc)[name = tensor("cast_0")]; tensor linear_3_cast_fp16 = linear(bias = d_decoders_0_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_0_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_3_cast_fp16")]; tensor tile_0 = const()[name = tensor("tile_0"), val = tensor([512, 512])]; tensor var_134_axis_0 = const()[name = tensor("op_134_axis_0"), val = tensor(-1)]; tensor var_134_cast_fp16_0, tensor var_134_cast_fp16_1 = split(axis = var_134_axis_0, split_sizes = tile_0, x = linear_3_cast_fp16)[name = tensor("op_134_cast_fp16")]; tensor var_137 = const()[name = tensor("op_137"), val = tensor([1, -1, 4, 128])]; tensor var_138_cast_fp16 = reshape(shape = var_137, x = var_134_cast_fp16_0)[name = tensor("op_138_cast_fp16")]; tensor var_140 = const()[name = tensor("op_140"), val = tensor([1, -1, 4, 128])]; tensor var_141_cast_fp16 = reshape(shape = var_140, x = var_134_cast_fp16_1)[name = tensor("op_141_cast_fp16")]; tensor value_1_perm_0 = const()[name = tensor("value_1_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_143_to_fp16 = const()[name = tensor("op_143_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_3_cast_fp16 = mul(x = var_129_cast_fp16, y = var_143_to_fp16)[name = tensor("q_h_3_cast_fp16")]; tensor scores_1_transpose_x_0 = const()[name = tensor("scores_1_transpose_x_0"), val = tensor(false)]; tensor scores_1_transpose_y_0 = const()[name = tensor("scores_1_transpose_y_0"), val = tensor(false)]; tensor transpose_64_perm_0 = const()[name = tensor("transpose_64_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_65_perm_0 = const()[name = tensor("transpose_65_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_65 = transpose(perm = transpose_65_perm_0, x = var_138_cast_fp16)[name = tensor("transpose_188")]; tensor transpose_64 = transpose(perm = transpose_64_perm_0, x = q_h_3_cast_fp16)[name = tensor("transpose_189")]; tensor scores_1_cast_fp16 = matmul(transpose_x = scores_1_transpose_x_0, transpose_y = scores_1_transpose_y_0, x = transpose_64, y = transpose_65)[name = tensor("scores_1_cast_fp16")]; tensor var_148_axes_0 = const()[name = tensor("op_148_axes_0"), val = tensor([1])]; tensor var_148_cast_fp16 = expand_dims(axes = var_148_axes_0, x = var_51_cast_fp16)[name = tensor("op_148_cast_fp16")]; tensor var_25_promoted_to_fp16 = const()[name = tensor("op_25_promoted_to_fp16"), val = tensor(0x0p+0)]; tensor mask_15_cast_fp16 = equal(x = var_148_cast_fp16, y = var_25_promoted_to_fp16)[name = tensor("mask_15_cast_fp16")]; tensor var_8_to_fp16 = const()[name = tensor("op_8_to_fp16"), val = tensor(-inf)]; tensor scores_3_cast_fp16 = select(a = var_8_to_fp16, b = scores_1_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_3_cast_fp16")]; tensor var_151_cast_fp16 = softmax(axis = var_20, x = scores_3_cast_fp16)[name = tensor("op_151_cast_fp16")]; tensor var_9_to_fp16 = const()[name = tensor("op_9_to_fp16"), val = tensor(0x0p+0)]; tensor input_21_cast_fp16 = select(a = var_9_to_fp16, b = var_151_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_21_cast_fp16")]; tensor x_13_transpose_x_0 = const()[name = tensor("x_13_transpose_x_0"), val = tensor(false)]; tensor x_13_transpose_y_0 = const()[name = tensor("x_13_transpose_y_0"), val = tensor(false)]; tensor value_1_cast_fp16 = transpose(perm = value_1_perm_0, x = var_141_cast_fp16)[name = tensor("transpose_187")]; tensor x_13_cast_fp16 = matmul(transpose_x = x_13_transpose_x_0, transpose_y = x_13_transpose_y_0, x = input_21_cast_fp16, y = value_1_cast_fp16)[name = tensor("x_13_cast_fp16")]; tensor var_155_perm_0 = const()[name = tensor("op_155_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_157 = const()[name = tensor("op_157"), val = tensor([1, -1, 512])]; tensor var_155_cast_fp16 = transpose(perm = var_155_perm_0, x = x_13_cast_fp16)[name = tensor("transpose_186")]; tensor input_23_cast_fp16 = reshape(shape = var_157, x = var_155_cast_fp16)[name = tensor("input_23_cast_fp16")]; tensor d_decoders_0_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_0_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2926208))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3188416))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_0_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_0_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3189504)))]; tensor linear_4_cast_fp16 = linear(bias = d_decoders_0_src_attn_linear_out_bias_to_fp16, weight = d_decoders_0_src_attn_linear_out_weight_to_fp16_quantized, x = input_23_cast_fp16)[name = tensor("linear_4_cast_fp16")]; tensor input_27_cast_fp16 = add(x = input_19_cast_fp16, y = linear_4_cast_fp16)[name = tensor("input_27_cast_fp16")]; tensor input_29_axes_0 = const()[name = tensor("input_29_axes_0"), val = tensor([-1])]; tensor d_decoders_1_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_1_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3190592)))]; tensor d_decoders_1_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_1_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3191680)))]; tensor input_29_cast_fp16 = layer_norm(axes = input_29_axes_0, beta = d_decoders_1_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_1_norm1_weight_to_fp16, x = input_27_cast_fp16)[name = tensor("input_29_cast_fp16")]; tensor d_decoders_1_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_1_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3192768))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4241408))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_1_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_1_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4245568)))]; tensor linear_5_cast_fp16 = linear(bias = d_decoders_1_feed_forward_w_1_bias_to_fp16, weight = d_decoders_1_feed_forward_w_1_weight_to_fp16_quantized, x = input_29_cast_fp16)[name = tensor("linear_5_cast_fp16")]; tensor input_33_cast_fp16 = relu(x = linear_5_cast_fp16)[name = tensor("input_33_cast_fp16")]; tensor input_37_axes_0 = const()[name = tensor("input_37_axes_0"), val = tensor([-1])]; tensor d_decoders_1_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_1_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4249728)))]; tensor d_decoders_1_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_1_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4253888)))]; tensor input_37_cast_fp16 = layer_norm(axes = input_37_axes_0, beta = d_decoders_1_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_1_feed_forward_norm_weight_to_fp16, x = input_33_cast_fp16)[name = tensor("input_37_cast_fp16")]; tensor d_decoders_1_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_1_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4258048))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5306688))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_6_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_1_feed_forward_w_2_weight_to_fp16_quantized, x = input_37_cast_fp16)[name = tensor("linear_6_cast_fp16")]; tensor inputs_5_axes_0 = const()[name = tensor("inputs_5_axes_0"), val = tensor([-1])]; tensor d_decoders_1_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_1_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5307776)))]; tensor d_decoders_1_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_1_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5308864)))]; tensor inputs_5_cast_fp16 = layer_norm(axes = inputs_5_axes_0, beta = d_decoders_1_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_1_norm2_weight_to_fp16, x = linear_6_cast_fp16)[name = tensor("inputs_5_cast_fp16")]; tensor inputs_7_cast_fp16 = mul(x = inputs_5_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_7_cast_fp16")]; tensor x_15_perm_0 = const()[name = tensor("x_15_perm_0"), val = tensor([0, 2, 1])]; tensor input_41_pad_0 = const()[name = tensor("input_41_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_41_mode_0 = const()[name = tensor("input_41_mode_0"), val = tensor("constant")]; tensor const_11_to_fp16 = const()[name = tensor("const_11_to_fp16"), val = tensor(0x0p+0)]; tensor x_15_cast_fp16 = transpose(perm = x_15_perm_0, x = inputs_7_cast_fp16)[name = tensor("transpose_185")]; tensor input_41_cast_fp16 = pad(constant_val = const_11_to_fp16, mode = input_41_mode_0, pad = input_41_pad_0, x = x_15_cast_fp16)[name = tensor("input_41_cast_fp16")]; tensor x_17_pad_type_0 = const()[name = tensor("x_17_pad_type_0"), val = tensor("valid")]; tensor x_17_groups_0 = const()[name = tensor("x_17_groups_0"), val = tensor(512)]; tensor x_17_strides_0 = const()[name = tensor("x_17_strides_0"), val = tensor([1])]; tensor x_17_pad_0 = const()[name = tensor("x_17_pad_0"), val = tensor([0, 0])]; tensor x_17_dilations_0 = const()[name = tensor("x_17_dilations_0"), val = tensor([1])]; tensor d_decoders_1_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_1_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5309952))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5315648))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_17_cast_fp16 = conv(dilations = x_17_dilations_0, groups = x_17_groups_0, pad = x_17_pad_0, pad_type = x_17_pad_type_0, strides = x_17_strides_0, weight = d_decoders_1_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_41_cast_fp16)[name = tensor("x_17_cast_fp16")]; tensor x_19_perm_0 = const()[name = tensor("x_19_perm_0"), val = tensor([0, 2, 1])]; tensor x_19_cast_fp16 = transpose(perm = x_19_perm_0, x = x_17_cast_fp16)[name = tensor("transpose_184")]; tensor input_43_cast_fp16 = add(x = x_19_cast_fp16, y = inputs_7_cast_fp16)[name = tensor("input_43_cast_fp16")]; tensor input_45_cast_fp16 = mul(x = input_43_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_45_cast_fp16")]; tensor input_47_cast_fp16 = add(x = input_27_cast_fp16, y = input_45_cast_fp16)[name = tensor("input_47_cast_fp16")]; tensor x_25_axes_0 = const()[name = tensor("x_25_axes_0"), val = tensor([-1])]; tensor d_decoders_1_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_1_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5316736)))]; tensor d_decoders_1_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_1_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5317824)))]; tensor x_25_cast_fp16 = layer_norm(axes = x_25_axes_0, beta = d_decoders_1_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_1_norm3_weight_to_fp16, x = input_47_cast_fp16)[name = tensor("x_25_cast_fp16")]; tensor d_decoders_1_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_1_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5318912))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5581120))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_1_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_1_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5582208)))]; tensor linear_7_cast_fp16 = linear(bias = d_decoders_1_src_attn_linear_q_bias_to_fp16, weight = d_decoders_1_src_attn_linear_q_weight_to_fp16_quantized, x = x_25_cast_fp16)[name = tensor("linear_7_cast_fp16")]; tensor var_223 = const()[name = tensor("op_223"), val = tensor([1, -1, 4, 128])]; tensor var_224_cast_fp16 = reshape(shape = var_223, x = linear_7_cast_fp16)[name = tensor("op_224_cast_fp16")]; tensor d_decoders_1_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_1_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5583296))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6107648))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_1_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_1_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6109760)))]; tensor linear_8_cast_fp16 = linear(bias = d_decoders_1_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_1_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_8_cast_fp16")]; tensor tile_1 = const()[name = tensor("tile_1"), val = tensor([512, 512])]; tensor var_229_axis_0 = const()[name = tensor("op_229_axis_0"), val = tensor(-1)]; tensor var_229_cast_fp16_0, tensor var_229_cast_fp16_1 = split(axis = var_229_axis_0, split_sizes = tile_1, x = linear_8_cast_fp16)[name = tensor("op_229_cast_fp16")]; tensor var_232 = const()[name = tensor("op_232"), val = tensor([1, -1, 4, 128])]; tensor var_233_cast_fp16 = reshape(shape = var_232, x = var_229_cast_fp16_0)[name = tensor("op_233_cast_fp16")]; tensor var_235 = const()[name = tensor("op_235"), val = tensor([1, -1, 4, 128])]; tensor var_236_cast_fp16 = reshape(shape = var_235, x = var_229_cast_fp16_1)[name = tensor("op_236_cast_fp16")]; tensor value_3_perm_0 = const()[name = tensor("value_3_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_238_to_fp16 = const()[name = tensor("op_238_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_7_cast_fp16 = mul(x = var_224_cast_fp16, y = var_238_to_fp16)[name = tensor("q_h_7_cast_fp16")]; tensor scores_5_transpose_x_0 = const()[name = tensor("scores_5_transpose_x_0"), val = tensor(false)]; tensor scores_5_transpose_y_0 = const()[name = tensor("scores_5_transpose_y_0"), val = tensor(false)]; tensor transpose_66_perm_0 = const()[name = tensor("transpose_66_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_67_perm_0 = const()[name = tensor("transpose_67_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_67 = transpose(perm = transpose_67_perm_0, x = var_233_cast_fp16)[name = tensor("transpose_182")]; tensor transpose_66 = transpose(perm = transpose_66_perm_0, x = q_h_7_cast_fp16)[name = tensor("transpose_183")]; tensor scores_5_cast_fp16 = matmul(transpose_x = scores_5_transpose_x_0, transpose_y = scores_5_transpose_y_0, x = transpose_66, y = transpose_67)[name = tensor("scores_5_cast_fp16")]; tensor scores_7_cast_fp16 = select(a = var_8_to_fp16, b = scores_5_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_7_cast_fp16")]; tensor var_246_cast_fp16 = softmax(axis = var_20, x = scores_7_cast_fp16)[name = tensor("op_246_cast_fp16")]; tensor input_49_cast_fp16 = select(a = var_9_to_fp16, b = var_246_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_49_cast_fp16")]; tensor x_27_transpose_x_0 = const()[name = tensor("x_27_transpose_x_0"), val = tensor(false)]; tensor x_27_transpose_y_0 = const()[name = tensor("x_27_transpose_y_0"), val = tensor(false)]; tensor value_3_cast_fp16 = transpose(perm = value_3_perm_0, x = var_236_cast_fp16)[name = tensor("transpose_181")]; tensor x_27_cast_fp16 = matmul(transpose_x = x_27_transpose_x_0, transpose_y = x_27_transpose_y_0, x = input_49_cast_fp16, y = value_3_cast_fp16)[name = tensor("x_27_cast_fp16")]; tensor var_250_perm_0 = const()[name = tensor("op_250_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_252 = const()[name = tensor("op_252"), val = tensor([1, -1, 512])]; tensor var_250_cast_fp16 = transpose(perm = var_250_perm_0, x = x_27_cast_fp16)[name = tensor("transpose_180")]; tensor input_51_cast_fp16 = reshape(shape = var_252, x = var_250_cast_fp16)[name = tensor("input_51_cast_fp16")]; tensor d_decoders_1_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_1_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6111872))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6374080))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_1_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_1_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6375168)))]; tensor linear_9_cast_fp16 = linear(bias = d_decoders_1_src_attn_linear_out_bias_to_fp16, weight = d_decoders_1_src_attn_linear_out_weight_to_fp16_quantized, x = input_51_cast_fp16)[name = tensor("linear_9_cast_fp16")]; tensor input_55_cast_fp16 = add(x = input_47_cast_fp16, y = linear_9_cast_fp16)[name = tensor("input_55_cast_fp16")]; tensor input_57_axes_0 = const()[name = tensor("input_57_axes_0"), val = tensor([-1])]; tensor d_decoders_2_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_2_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6376256)))]; tensor d_decoders_2_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_2_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6377344)))]; tensor input_57_cast_fp16 = layer_norm(axes = input_57_axes_0, beta = d_decoders_2_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_2_norm1_weight_to_fp16, x = input_55_cast_fp16)[name = tensor("input_57_cast_fp16")]; tensor d_decoders_2_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_2_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6378432))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7427072))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_2_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_2_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7431232)))]; tensor linear_10_cast_fp16 = linear(bias = d_decoders_2_feed_forward_w_1_bias_to_fp16, weight = d_decoders_2_feed_forward_w_1_weight_to_fp16_quantized, x = input_57_cast_fp16)[name = tensor("linear_10_cast_fp16")]; tensor input_61_cast_fp16 = relu(x = linear_10_cast_fp16)[name = tensor("input_61_cast_fp16")]; tensor input_65_axes_0 = const()[name = tensor("input_65_axes_0"), val = tensor([-1])]; tensor d_decoders_2_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_2_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7435392)))]; tensor d_decoders_2_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_2_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7439552)))]; tensor input_65_cast_fp16 = layer_norm(axes = input_65_axes_0, beta = d_decoders_2_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_2_feed_forward_norm_weight_to_fp16, x = input_61_cast_fp16)[name = tensor("input_65_cast_fp16")]; tensor d_decoders_2_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_2_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7443712))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8492352))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_11_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_2_feed_forward_w_2_weight_to_fp16_quantized, x = input_65_cast_fp16)[name = tensor("linear_11_cast_fp16")]; tensor inputs_9_axes_0 = const()[name = tensor("inputs_9_axes_0"), val = tensor([-1])]; tensor d_decoders_2_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_2_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8493440)))]; tensor d_decoders_2_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_2_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8494528)))]; tensor inputs_9_cast_fp16 = layer_norm(axes = inputs_9_axes_0, beta = d_decoders_2_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_2_norm2_weight_to_fp16, x = linear_11_cast_fp16)[name = tensor("inputs_9_cast_fp16")]; tensor inputs_11_cast_fp16 = mul(x = inputs_9_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_11_cast_fp16")]; tensor x_29_perm_0 = const()[name = tensor("x_29_perm_0"), val = tensor([0, 2, 1])]; tensor input_69_pad_0 = const()[name = tensor("input_69_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_69_mode_0 = const()[name = tensor("input_69_mode_0"), val = tensor("constant")]; tensor const_17_to_fp16 = const()[name = tensor("const_17_to_fp16"), val = tensor(0x0p+0)]; tensor x_29_cast_fp16 = transpose(perm = x_29_perm_0, x = inputs_11_cast_fp16)[name = tensor("transpose_179")]; tensor input_69_cast_fp16 = pad(constant_val = const_17_to_fp16, mode = input_69_mode_0, pad = input_69_pad_0, x = x_29_cast_fp16)[name = tensor("input_69_cast_fp16")]; tensor x_31_pad_type_0 = const()[name = tensor("x_31_pad_type_0"), val = tensor("valid")]; tensor x_31_groups_0 = const()[name = tensor("x_31_groups_0"), val = tensor(512)]; tensor x_31_strides_0 = const()[name = tensor("x_31_strides_0"), val = tensor([1])]; tensor x_31_pad_0 = const()[name = tensor("x_31_pad_0"), val = tensor([0, 0])]; tensor x_31_dilations_0 = const()[name = tensor("x_31_dilations_0"), val = tensor([1])]; tensor d_decoders_2_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_2_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8495616))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8501312))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_31_cast_fp16 = conv(dilations = x_31_dilations_0, groups = x_31_groups_0, pad = x_31_pad_0, pad_type = x_31_pad_type_0, strides = x_31_strides_0, weight = d_decoders_2_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_69_cast_fp16)[name = tensor("x_31_cast_fp16")]; tensor x_33_perm_0 = const()[name = tensor("x_33_perm_0"), val = tensor([0, 2, 1])]; tensor x_33_cast_fp16 = transpose(perm = x_33_perm_0, x = x_31_cast_fp16)[name = tensor("transpose_178")]; tensor input_71_cast_fp16 = add(x = x_33_cast_fp16, y = inputs_11_cast_fp16)[name = tensor("input_71_cast_fp16")]; tensor input_73_cast_fp16 = mul(x = input_71_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_73_cast_fp16")]; tensor input_75_cast_fp16 = add(x = input_55_cast_fp16, y = input_73_cast_fp16)[name = tensor("input_75_cast_fp16")]; tensor x_39_axes_0 = const()[name = tensor("x_39_axes_0"), val = tensor([-1])]; tensor d_decoders_2_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_2_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8502400)))]; tensor d_decoders_2_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_2_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8503488)))]; tensor x_39_cast_fp16 = layer_norm(axes = x_39_axes_0, beta = d_decoders_2_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_2_norm3_weight_to_fp16, x = input_75_cast_fp16)[name = tensor("x_39_cast_fp16")]; tensor d_decoders_2_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_2_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8504576))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8766784))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_2_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_2_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8767872)))]; tensor linear_12_cast_fp16 = linear(bias = d_decoders_2_src_attn_linear_q_bias_to_fp16, weight = d_decoders_2_src_attn_linear_q_weight_to_fp16_quantized, x = x_39_cast_fp16)[name = tensor("linear_12_cast_fp16")]; tensor var_318 = const()[name = tensor("op_318"), val = tensor([1, -1, 4, 128])]; tensor var_319_cast_fp16 = reshape(shape = var_318, x = linear_12_cast_fp16)[name = tensor("op_319_cast_fp16")]; tensor d_decoders_2_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_2_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8768960))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9293312))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_2_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_2_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9295424)))]; tensor linear_13_cast_fp16 = linear(bias = d_decoders_2_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_2_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_13_cast_fp16")]; tensor tile_2 = const()[name = tensor("tile_2"), val = tensor([512, 512])]; tensor var_324_axis_0 = const()[name = tensor("op_324_axis_0"), val = tensor(-1)]; tensor var_324_cast_fp16_0, tensor var_324_cast_fp16_1 = split(axis = var_324_axis_0, split_sizes = tile_2, x = linear_13_cast_fp16)[name = tensor("op_324_cast_fp16")]; tensor var_327 = const()[name = tensor("op_327"), val = tensor([1, -1, 4, 128])]; tensor var_328_cast_fp16 = reshape(shape = var_327, x = var_324_cast_fp16_0)[name = tensor("op_328_cast_fp16")]; tensor var_330 = const()[name = tensor("op_330"), val = tensor([1, -1, 4, 128])]; tensor var_331_cast_fp16 = reshape(shape = var_330, x = var_324_cast_fp16_1)[name = tensor("op_331_cast_fp16")]; tensor value_5_perm_0 = const()[name = tensor("value_5_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_333_to_fp16 = const()[name = tensor("op_333_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_11_cast_fp16 = mul(x = var_319_cast_fp16, y = var_333_to_fp16)[name = tensor("q_h_11_cast_fp16")]; tensor scores_9_transpose_x_0 = const()[name = tensor("scores_9_transpose_x_0"), val = tensor(false)]; tensor scores_9_transpose_y_0 = const()[name = tensor("scores_9_transpose_y_0"), val = tensor(false)]; tensor transpose_68_perm_0 = const()[name = tensor("transpose_68_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_69_perm_0 = const()[name = tensor("transpose_69_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_69 = transpose(perm = transpose_69_perm_0, x = var_328_cast_fp16)[name = tensor("transpose_176")]; tensor transpose_68 = transpose(perm = transpose_68_perm_0, x = q_h_11_cast_fp16)[name = tensor("transpose_177")]; tensor scores_9_cast_fp16 = matmul(transpose_x = scores_9_transpose_x_0, transpose_y = scores_9_transpose_y_0, x = transpose_68, y = transpose_69)[name = tensor("scores_9_cast_fp16")]; tensor scores_11_cast_fp16 = select(a = var_8_to_fp16, b = scores_9_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_11_cast_fp16")]; tensor var_341_cast_fp16 = softmax(axis = var_20, x = scores_11_cast_fp16)[name = tensor("op_341_cast_fp16")]; tensor input_77_cast_fp16 = select(a = var_9_to_fp16, b = var_341_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_77_cast_fp16")]; tensor x_41_transpose_x_0 = const()[name = tensor("x_41_transpose_x_0"), val = tensor(false)]; tensor x_41_transpose_y_0 = const()[name = tensor("x_41_transpose_y_0"), val = tensor(false)]; tensor value_5_cast_fp16 = transpose(perm = value_5_perm_0, x = var_331_cast_fp16)[name = tensor("transpose_175")]; tensor x_41_cast_fp16 = matmul(transpose_x = x_41_transpose_x_0, transpose_y = x_41_transpose_y_0, x = input_77_cast_fp16, y = value_5_cast_fp16)[name = tensor("x_41_cast_fp16")]; tensor var_345_perm_0 = const()[name = tensor("op_345_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_347 = const()[name = tensor("op_347"), val = tensor([1, -1, 512])]; tensor var_345_cast_fp16 = transpose(perm = var_345_perm_0, x = x_41_cast_fp16)[name = tensor("transpose_174")]; tensor input_79_cast_fp16 = reshape(shape = var_347, x = var_345_cast_fp16)[name = tensor("input_79_cast_fp16")]; tensor d_decoders_2_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_2_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9297536))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9559744))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_2_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_2_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9560832)))]; tensor linear_14_cast_fp16 = linear(bias = d_decoders_2_src_attn_linear_out_bias_to_fp16, weight = d_decoders_2_src_attn_linear_out_weight_to_fp16_quantized, x = input_79_cast_fp16)[name = tensor("linear_14_cast_fp16")]; tensor input_83_cast_fp16 = add(x = input_75_cast_fp16, y = linear_14_cast_fp16)[name = tensor("input_83_cast_fp16")]; tensor input_85_axes_0 = const()[name = tensor("input_85_axes_0"), val = tensor([-1])]; tensor d_decoders_3_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_3_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9561920)))]; tensor d_decoders_3_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_3_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9563008)))]; tensor input_85_cast_fp16 = layer_norm(axes = input_85_axes_0, beta = d_decoders_3_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_3_norm1_weight_to_fp16, x = input_83_cast_fp16)[name = tensor("input_85_cast_fp16")]; tensor d_decoders_3_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_3_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9564096))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10612736))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_3_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_3_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10616896)))]; tensor linear_15_cast_fp16 = linear(bias = d_decoders_3_feed_forward_w_1_bias_to_fp16, weight = d_decoders_3_feed_forward_w_1_weight_to_fp16_quantized, x = input_85_cast_fp16)[name = tensor("linear_15_cast_fp16")]; tensor input_89_cast_fp16 = relu(x = linear_15_cast_fp16)[name = tensor("input_89_cast_fp16")]; tensor input_93_axes_0 = const()[name = tensor("input_93_axes_0"), val = tensor([-1])]; tensor d_decoders_3_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_3_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10621056)))]; tensor d_decoders_3_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_3_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10625216)))]; tensor input_93_cast_fp16 = layer_norm(axes = input_93_axes_0, beta = d_decoders_3_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_3_feed_forward_norm_weight_to_fp16, x = input_89_cast_fp16)[name = tensor("input_93_cast_fp16")]; tensor d_decoders_3_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_3_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10629376))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11678016))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_16_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_3_feed_forward_w_2_weight_to_fp16_quantized, x = input_93_cast_fp16)[name = tensor("linear_16_cast_fp16")]; tensor inputs_13_axes_0 = const()[name = tensor("inputs_13_axes_0"), val = tensor([-1])]; tensor d_decoders_3_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_3_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11679104)))]; tensor d_decoders_3_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_3_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11680192)))]; tensor inputs_13_cast_fp16 = layer_norm(axes = inputs_13_axes_0, beta = d_decoders_3_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_3_norm2_weight_to_fp16, x = linear_16_cast_fp16)[name = tensor("inputs_13_cast_fp16")]; tensor inputs_15_cast_fp16 = mul(x = inputs_13_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_15_cast_fp16")]; tensor x_43_perm_0 = const()[name = tensor("x_43_perm_0"), val = tensor([0, 2, 1])]; tensor input_97_pad_0 = const()[name = tensor("input_97_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_97_mode_0 = const()[name = tensor("input_97_mode_0"), val = tensor("constant")]; tensor const_23_to_fp16 = const()[name = tensor("const_23_to_fp16"), val = tensor(0x0p+0)]; tensor x_43_cast_fp16 = transpose(perm = x_43_perm_0, x = inputs_15_cast_fp16)[name = tensor("transpose_173")]; tensor input_97_cast_fp16 = pad(constant_val = const_23_to_fp16, mode = input_97_mode_0, pad = input_97_pad_0, x = x_43_cast_fp16)[name = tensor("input_97_cast_fp16")]; tensor x_45_pad_type_0 = const()[name = tensor("x_45_pad_type_0"), val = tensor("valid")]; tensor x_45_groups_0 = const()[name = tensor("x_45_groups_0"), val = tensor(512)]; tensor x_45_strides_0 = const()[name = tensor("x_45_strides_0"), val = tensor([1])]; tensor x_45_pad_0 = const()[name = tensor("x_45_pad_0"), val = tensor([0, 0])]; tensor x_45_dilations_0 = const()[name = tensor("x_45_dilations_0"), val = tensor([1])]; tensor d_decoders_3_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_3_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11681280))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11686976))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_45_cast_fp16 = conv(dilations = x_45_dilations_0, groups = x_45_groups_0, pad = x_45_pad_0, pad_type = x_45_pad_type_0, strides = x_45_strides_0, weight = d_decoders_3_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_97_cast_fp16)[name = tensor("x_45_cast_fp16")]; tensor x_47_perm_0 = const()[name = tensor("x_47_perm_0"), val = tensor([0, 2, 1])]; tensor x_47_cast_fp16 = transpose(perm = x_47_perm_0, x = x_45_cast_fp16)[name = tensor("transpose_172")]; tensor input_99_cast_fp16 = add(x = x_47_cast_fp16, y = inputs_15_cast_fp16)[name = tensor("input_99_cast_fp16")]; tensor input_101_cast_fp16 = mul(x = input_99_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_101_cast_fp16")]; tensor input_103_cast_fp16 = add(x = input_83_cast_fp16, y = input_101_cast_fp16)[name = tensor("input_103_cast_fp16")]; tensor x_53_axes_0 = const()[name = tensor("x_53_axes_0"), val = tensor([-1])]; tensor d_decoders_3_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_3_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11688064)))]; tensor d_decoders_3_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_3_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11689152)))]; tensor x_53_cast_fp16 = layer_norm(axes = x_53_axes_0, beta = d_decoders_3_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_3_norm3_weight_to_fp16, x = input_103_cast_fp16)[name = tensor("x_53_cast_fp16")]; tensor d_decoders_3_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_3_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11690240))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11952448))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_3_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_3_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11953536)))]; tensor linear_17_cast_fp16 = linear(bias = d_decoders_3_src_attn_linear_q_bias_to_fp16, weight = d_decoders_3_src_attn_linear_q_weight_to_fp16_quantized, x = x_53_cast_fp16)[name = tensor("linear_17_cast_fp16")]; tensor var_413 = const()[name = tensor("op_413"), val = tensor([1, -1, 4, 128])]; tensor var_414_cast_fp16 = reshape(shape = var_413, x = linear_17_cast_fp16)[name = tensor("op_414_cast_fp16")]; tensor d_decoders_3_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_3_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11954624))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12478976))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_3_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_3_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12481088)))]; tensor linear_18_cast_fp16 = linear(bias = d_decoders_3_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_3_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_18_cast_fp16")]; tensor tile_3 = const()[name = tensor("tile_3"), val = tensor([512, 512])]; tensor var_419_axis_0 = const()[name = tensor("op_419_axis_0"), val = tensor(-1)]; tensor var_419_cast_fp16_0, tensor var_419_cast_fp16_1 = split(axis = var_419_axis_0, split_sizes = tile_3, x = linear_18_cast_fp16)[name = tensor("op_419_cast_fp16")]; tensor var_422 = const()[name = tensor("op_422"), val = tensor([1, -1, 4, 128])]; tensor var_423_cast_fp16 = reshape(shape = var_422, x = var_419_cast_fp16_0)[name = tensor("op_423_cast_fp16")]; tensor var_425 = const()[name = tensor("op_425"), val = tensor([1, -1, 4, 128])]; tensor var_426_cast_fp16 = reshape(shape = var_425, x = var_419_cast_fp16_1)[name = tensor("op_426_cast_fp16")]; tensor value_7_perm_0 = const()[name = tensor("value_7_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_428_to_fp16 = const()[name = tensor("op_428_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_15_cast_fp16 = mul(x = var_414_cast_fp16, y = var_428_to_fp16)[name = tensor("q_h_15_cast_fp16")]; tensor scores_13_transpose_x_0 = const()[name = tensor("scores_13_transpose_x_0"), val = tensor(false)]; tensor scores_13_transpose_y_0 = const()[name = tensor("scores_13_transpose_y_0"), val = tensor(false)]; tensor transpose_70_perm_0 = const()[name = tensor("transpose_70_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_71_perm_0 = const()[name = tensor("transpose_71_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_71 = transpose(perm = transpose_71_perm_0, x = var_423_cast_fp16)[name = tensor("transpose_170")]; tensor transpose_70 = transpose(perm = transpose_70_perm_0, x = q_h_15_cast_fp16)[name = tensor("transpose_171")]; tensor scores_13_cast_fp16 = matmul(transpose_x = scores_13_transpose_x_0, transpose_y = scores_13_transpose_y_0, x = transpose_70, y = transpose_71)[name = tensor("scores_13_cast_fp16")]; tensor scores_15_cast_fp16 = select(a = var_8_to_fp16, b = scores_13_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_15_cast_fp16")]; tensor var_436_cast_fp16 = softmax(axis = var_20, x = scores_15_cast_fp16)[name = tensor("op_436_cast_fp16")]; tensor input_105_cast_fp16 = select(a = var_9_to_fp16, b = var_436_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_105_cast_fp16")]; tensor x_55_transpose_x_0 = const()[name = tensor("x_55_transpose_x_0"), val = tensor(false)]; tensor x_55_transpose_y_0 = const()[name = tensor("x_55_transpose_y_0"), val = tensor(false)]; tensor value_7_cast_fp16 = transpose(perm = value_7_perm_0, x = var_426_cast_fp16)[name = tensor("transpose_169")]; tensor x_55_cast_fp16 = matmul(transpose_x = x_55_transpose_x_0, transpose_y = x_55_transpose_y_0, x = input_105_cast_fp16, y = value_7_cast_fp16)[name = tensor("x_55_cast_fp16")]; tensor var_440_perm_0 = const()[name = tensor("op_440_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_442 = const()[name = tensor("op_442"), val = tensor([1, -1, 512])]; tensor var_440_cast_fp16 = transpose(perm = var_440_perm_0, x = x_55_cast_fp16)[name = tensor("transpose_168")]; tensor input_107_cast_fp16 = reshape(shape = var_442, x = var_440_cast_fp16)[name = tensor("input_107_cast_fp16")]; tensor d_decoders_3_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_3_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12483200))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12745408))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_3_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_3_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12746496)))]; tensor linear_19_cast_fp16 = linear(bias = d_decoders_3_src_attn_linear_out_bias_to_fp16, weight = d_decoders_3_src_attn_linear_out_weight_to_fp16_quantized, x = input_107_cast_fp16)[name = tensor("linear_19_cast_fp16")]; tensor input_111_cast_fp16 = add(x = input_103_cast_fp16, y = linear_19_cast_fp16)[name = tensor("input_111_cast_fp16")]; tensor input_113_axes_0 = const()[name = tensor("input_113_axes_0"), val = tensor([-1])]; tensor d_decoders_4_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_4_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12747584)))]; tensor d_decoders_4_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_4_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12748672)))]; tensor input_113_cast_fp16 = layer_norm(axes = input_113_axes_0, beta = d_decoders_4_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_4_norm1_weight_to_fp16, x = input_111_cast_fp16)[name = tensor("input_113_cast_fp16")]; tensor d_decoders_4_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_4_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12749760))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13798400))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_4_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_4_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13802560)))]; tensor linear_20_cast_fp16 = linear(bias = d_decoders_4_feed_forward_w_1_bias_to_fp16, weight = d_decoders_4_feed_forward_w_1_weight_to_fp16_quantized, x = input_113_cast_fp16)[name = tensor("linear_20_cast_fp16")]; tensor input_117_cast_fp16 = relu(x = linear_20_cast_fp16)[name = tensor("input_117_cast_fp16")]; tensor input_121_axes_0 = const()[name = tensor("input_121_axes_0"), val = tensor([-1])]; tensor d_decoders_4_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_4_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13806720)))]; tensor d_decoders_4_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_4_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13810880)))]; tensor input_121_cast_fp16 = layer_norm(axes = input_121_axes_0, beta = d_decoders_4_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_4_feed_forward_norm_weight_to_fp16, x = input_117_cast_fp16)[name = tensor("input_121_cast_fp16")]; tensor d_decoders_4_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_4_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13815040))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14863680))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_21_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_4_feed_forward_w_2_weight_to_fp16_quantized, x = input_121_cast_fp16)[name = tensor("linear_21_cast_fp16")]; tensor inputs_17_axes_0 = const()[name = tensor("inputs_17_axes_0"), val = tensor([-1])]; tensor d_decoders_4_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_4_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14864768)))]; tensor d_decoders_4_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_4_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14865856)))]; tensor inputs_17_cast_fp16 = layer_norm(axes = inputs_17_axes_0, beta = d_decoders_4_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_4_norm2_weight_to_fp16, x = linear_21_cast_fp16)[name = tensor("inputs_17_cast_fp16")]; tensor inputs_19_cast_fp16 = mul(x = inputs_17_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_19_cast_fp16")]; tensor x_57_perm_0 = const()[name = tensor("x_57_perm_0"), val = tensor([0, 2, 1])]; tensor input_125_pad_0 = const()[name = tensor("input_125_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_125_mode_0 = const()[name = tensor("input_125_mode_0"), val = tensor("constant")]; tensor const_29_to_fp16 = const()[name = tensor("const_29_to_fp16"), val = tensor(0x0p+0)]; tensor x_57_cast_fp16 = transpose(perm = x_57_perm_0, x = inputs_19_cast_fp16)[name = tensor("transpose_167")]; tensor input_125_cast_fp16 = pad(constant_val = const_29_to_fp16, mode = input_125_mode_0, pad = input_125_pad_0, x = x_57_cast_fp16)[name = tensor("input_125_cast_fp16")]; tensor x_59_pad_type_0 = const()[name = tensor("x_59_pad_type_0"), val = tensor("valid")]; tensor x_59_groups_0 = const()[name = tensor("x_59_groups_0"), val = tensor(512)]; tensor x_59_strides_0 = const()[name = tensor("x_59_strides_0"), val = tensor([1])]; tensor x_59_pad_0 = const()[name = tensor("x_59_pad_0"), val = tensor([0, 0])]; tensor x_59_dilations_0 = const()[name = tensor("x_59_dilations_0"), val = tensor([1])]; tensor d_decoders_4_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_4_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14866944))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14872640))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_59_cast_fp16 = conv(dilations = x_59_dilations_0, groups = x_59_groups_0, pad = x_59_pad_0, pad_type = x_59_pad_type_0, strides = x_59_strides_0, weight = d_decoders_4_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_125_cast_fp16)[name = tensor("x_59_cast_fp16")]; tensor x_61_perm_0 = const()[name = tensor("x_61_perm_0"), val = tensor([0, 2, 1])]; tensor x_61_cast_fp16 = transpose(perm = x_61_perm_0, x = x_59_cast_fp16)[name = tensor("transpose_166")]; tensor input_127_cast_fp16 = add(x = x_61_cast_fp16, y = inputs_19_cast_fp16)[name = tensor("input_127_cast_fp16")]; tensor input_129_cast_fp16 = mul(x = input_127_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_129_cast_fp16")]; tensor input_131_cast_fp16 = add(x = input_111_cast_fp16, y = input_129_cast_fp16)[name = tensor("input_131_cast_fp16")]; tensor x_67_axes_0 = const()[name = tensor("x_67_axes_0"), val = tensor([-1])]; tensor d_decoders_4_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_4_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14873728)))]; tensor d_decoders_4_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_4_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14874816)))]; tensor x_67_cast_fp16 = layer_norm(axes = x_67_axes_0, beta = d_decoders_4_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_4_norm3_weight_to_fp16, x = input_131_cast_fp16)[name = tensor("x_67_cast_fp16")]; tensor d_decoders_4_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_4_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14875904))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15138112))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_4_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_4_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15139200)))]; tensor linear_22_cast_fp16 = linear(bias = d_decoders_4_src_attn_linear_q_bias_to_fp16, weight = d_decoders_4_src_attn_linear_q_weight_to_fp16_quantized, x = x_67_cast_fp16)[name = tensor("linear_22_cast_fp16")]; tensor var_508 = const()[name = tensor("op_508"), val = tensor([1, -1, 4, 128])]; tensor var_509_cast_fp16 = reshape(shape = var_508, x = linear_22_cast_fp16)[name = tensor("op_509_cast_fp16")]; tensor d_decoders_4_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_4_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15140288))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15664640))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_4_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_4_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15666752)))]; tensor linear_23_cast_fp16 = linear(bias = d_decoders_4_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_4_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_23_cast_fp16")]; tensor tile_4 = const()[name = tensor("tile_4"), val = tensor([512, 512])]; tensor var_514_axis_0 = const()[name = tensor("op_514_axis_0"), val = tensor(-1)]; tensor var_514_cast_fp16_0, tensor var_514_cast_fp16_1 = split(axis = var_514_axis_0, split_sizes = tile_4, x = linear_23_cast_fp16)[name = tensor("op_514_cast_fp16")]; tensor var_517 = const()[name = tensor("op_517"), val = tensor([1, -1, 4, 128])]; tensor var_518_cast_fp16 = reshape(shape = var_517, x = var_514_cast_fp16_0)[name = tensor("op_518_cast_fp16")]; tensor var_520 = const()[name = tensor("op_520"), val = tensor([1, -1, 4, 128])]; tensor var_521_cast_fp16 = reshape(shape = var_520, x = var_514_cast_fp16_1)[name = tensor("op_521_cast_fp16")]; tensor value_9_perm_0 = const()[name = tensor("value_9_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_523_to_fp16 = const()[name = tensor("op_523_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_19_cast_fp16 = mul(x = var_509_cast_fp16, y = var_523_to_fp16)[name = tensor("q_h_19_cast_fp16")]; tensor scores_17_transpose_x_0 = const()[name = tensor("scores_17_transpose_x_0"), val = tensor(false)]; tensor scores_17_transpose_y_0 = const()[name = tensor("scores_17_transpose_y_0"), val = tensor(false)]; tensor transpose_72_perm_0 = const()[name = tensor("transpose_72_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_73_perm_0 = const()[name = tensor("transpose_73_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_73 = transpose(perm = transpose_73_perm_0, x = var_518_cast_fp16)[name = tensor("transpose_164")]; tensor transpose_72 = transpose(perm = transpose_72_perm_0, x = q_h_19_cast_fp16)[name = tensor("transpose_165")]; tensor scores_17_cast_fp16 = matmul(transpose_x = scores_17_transpose_x_0, transpose_y = scores_17_transpose_y_0, x = transpose_72, y = transpose_73)[name = tensor("scores_17_cast_fp16")]; tensor scores_19_cast_fp16 = select(a = var_8_to_fp16, b = scores_17_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_19_cast_fp16")]; tensor var_531_cast_fp16 = softmax(axis = var_20, x = scores_19_cast_fp16)[name = tensor("op_531_cast_fp16")]; tensor input_133_cast_fp16 = select(a = var_9_to_fp16, b = var_531_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_133_cast_fp16")]; tensor x_69_transpose_x_0 = const()[name = tensor("x_69_transpose_x_0"), val = tensor(false)]; tensor x_69_transpose_y_0 = const()[name = tensor("x_69_transpose_y_0"), val = tensor(false)]; tensor value_9_cast_fp16 = transpose(perm = value_9_perm_0, x = var_521_cast_fp16)[name = tensor("transpose_163")]; tensor x_69_cast_fp16 = matmul(transpose_x = x_69_transpose_x_0, transpose_y = x_69_transpose_y_0, x = input_133_cast_fp16, y = value_9_cast_fp16)[name = tensor("x_69_cast_fp16")]; tensor var_535_perm_0 = const()[name = tensor("op_535_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_537 = const()[name = tensor("op_537"), val = tensor([1, -1, 512])]; tensor var_535_cast_fp16 = transpose(perm = var_535_perm_0, x = x_69_cast_fp16)[name = tensor("transpose_162")]; tensor input_135_cast_fp16 = reshape(shape = var_537, x = var_535_cast_fp16)[name = tensor("input_135_cast_fp16")]; tensor d_decoders_4_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_4_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15668864))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15931072))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_4_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_4_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15932160)))]; tensor linear_24_cast_fp16 = linear(bias = d_decoders_4_src_attn_linear_out_bias_to_fp16, weight = d_decoders_4_src_attn_linear_out_weight_to_fp16_quantized, x = input_135_cast_fp16)[name = tensor("linear_24_cast_fp16")]; tensor input_139_cast_fp16 = add(x = input_131_cast_fp16, y = linear_24_cast_fp16)[name = tensor("input_139_cast_fp16")]; tensor input_141_axes_0 = const()[name = tensor("input_141_axes_0"), val = tensor([-1])]; tensor d_decoders_5_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_5_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15933248)))]; tensor d_decoders_5_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_5_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15934336)))]; tensor input_141_cast_fp16 = layer_norm(axes = input_141_axes_0, beta = d_decoders_5_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_5_norm1_weight_to_fp16, x = input_139_cast_fp16)[name = tensor("input_141_cast_fp16")]; tensor d_decoders_5_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_5_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15935424))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16984064))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_5_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_5_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16988224)))]; tensor linear_25_cast_fp16 = linear(bias = d_decoders_5_feed_forward_w_1_bias_to_fp16, weight = d_decoders_5_feed_forward_w_1_weight_to_fp16_quantized, x = input_141_cast_fp16)[name = tensor("linear_25_cast_fp16")]; tensor input_145_cast_fp16 = relu(x = linear_25_cast_fp16)[name = tensor("input_145_cast_fp16")]; tensor input_149_axes_0 = const()[name = tensor("input_149_axes_0"), val = tensor([-1])]; tensor d_decoders_5_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_5_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16992384)))]; tensor d_decoders_5_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_5_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16996544)))]; tensor input_149_cast_fp16 = layer_norm(axes = input_149_axes_0, beta = d_decoders_5_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_5_feed_forward_norm_weight_to_fp16, x = input_145_cast_fp16)[name = tensor("input_149_cast_fp16")]; tensor d_decoders_5_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_5_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17000704))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18049344))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_26_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_5_feed_forward_w_2_weight_to_fp16_quantized, x = input_149_cast_fp16)[name = tensor("linear_26_cast_fp16")]; tensor inputs_21_axes_0 = const()[name = tensor("inputs_21_axes_0"), val = tensor([-1])]; tensor d_decoders_5_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_5_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18050432)))]; tensor d_decoders_5_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_5_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18051520)))]; tensor inputs_21_cast_fp16 = layer_norm(axes = inputs_21_axes_0, beta = d_decoders_5_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_5_norm2_weight_to_fp16, x = linear_26_cast_fp16)[name = tensor("inputs_21_cast_fp16")]; tensor inputs_23_cast_fp16 = mul(x = inputs_21_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_23_cast_fp16")]; tensor x_71_perm_0 = const()[name = tensor("x_71_perm_0"), val = tensor([0, 2, 1])]; tensor input_153_pad_0 = const()[name = tensor("input_153_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_153_mode_0 = const()[name = tensor("input_153_mode_0"), val = tensor("constant")]; tensor const_35_to_fp16 = const()[name = tensor("const_35_to_fp16"), val = tensor(0x0p+0)]; tensor x_71_cast_fp16 = transpose(perm = x_71_perm_0, x = inputs_23_cast_fp16)[name = tensor("transpose_161")]; tensor input_153_cast_fp16 = pad(constant_val = const_35_to_fp16, mode = input_153_mode_0, pad = input_153_pad_0, x = x_71_cast_fp16)[name = tensor("input_153_cast_fp16")]; tensor x_73_pad_type_0 = const()[name = tensor("x_73_pad_type_0"), val = tensor("valid")]; tensor x_73_groups_0 = const()[name = tensor("x_73_groups_0"), val = tensor(512)]; tensor x_73_strides_0 = const()[name = tensor("x_73_strides_0"), val = tensor([1])]; tensor x_73_pad_0 = const()[name = tensor("x_73_pad_0"), val = tensor([0, 0])]; tensor x_73_dilations_0 = const()[name = tensor("x_73_dilations_0"), val = tensor([1])]; tensor d_decoders_5_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_5_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18052608))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18058304))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_73_cast_fp16 = conv(dilations = x_73_dilations_0, groups = x_73_groups_0, pad = x_73_pad_0, pad_type = x_73_pad_type_0, strides = x_73_strides_0, weight = d_decoders_5_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_153_cast_fp16)[name = tensor("x_73_cast_fp16")]; tensor x_75_perm_0 = const()[name = tensor("x_75_perm_0"), val = tensor([0, 2, 1])]; tensor x_75_cast_fp16 = transpose(perm = x_75_perm_0, x = x_73_cast_fp16)[name = tensor("transpose_160")]; tensor input_155_cast_fp16 = add(x = x_75_cast_fp16, y = inputs_23_cast_fp16)[name = tensor("input_155_cast_fp16")]; tensor input_157_cast_fp16 = mul(x = input_155_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_157_cast_fp16")]; tensor input_159_cast_fp16 = add(x = input_139_cast_fp16, y = input_157_cast_fp16)[name = tensor("input_159_cast_fp16")]; tensor x_81_axes_0 = const()[name = tensor("x_81_axes_0"), val = tensor([-1])]; tensor d_decoders_5_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_5_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18059392)))]; tensor d_decoders_5_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_5_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18060480)))]; tensor x_81_cast_fp16 = layer_norm(axes = x_81_axes_0, beta = d_decoders_5_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_5_norm3_weight_to_fp16, x = input_159_cast_fp16)[name = tensor("x_81_cast_fp16")]; tensor d_decoders_5_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_5_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18061568))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18323776))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_5_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_5_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18324864)))]; tensor linear_27_cast_fp16 = linear(bias = d_decoders_5_src_attn_linear_q_bias_to_fp16, weight = d_decoders_5_src_attn_linear_q_weight_to_fp16_quantized, x = x_81_cast_fp16)[name = tensor("linear_27_cast_fp16")]; tensor var_603 = const()[name = tensor("op_603"), val = tensor([1, -1, 4, 128])]; tensor var_604_cast_fp16 = reshape(shape = var_603, x = linear_27_cast_fp16)[name = tensor("op_604_cast_fp16")]; tensor d_decoders_5_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_5_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18325952))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18850304))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_5_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_5_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18852416)))]; tensor linear_28_cast_fp16 = linear(bias = d_decoders_5_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_5_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_28_cast_fp16")]; tensor tile_5 = const()[name = tensor("tile_5"), val = tensor([512, 512])]; tensor var_609_axis_0 = const()[name = tensor("op_609_axis_0"), val = tensor(-1)]; tensor var_609_cast_fp16_0, tensor var_609_cast_fp16_1 = split(axis = var_609_axis_0, split_sizes = tile_5, x = linear_28_cast_fp16)[name = tensor("op_609_cast_fp16")]; tensor var_612 = const()[name = tensor("op_612"), val = tensor([1, -1, 4, 128])]; tensor var_613_cast_fp16 = reshape(shape = var_612, x = var_609_cast_fp16_0)[name = tensor("op_613_cast_fp16")]; tensor var_615 = const()[name = tensor("op_615"), val = tensor([1, -1, 4, 128])]; tensor var_616_cast_fp16 = reshape(shape = var_615, x = var_609_cast_fp16_1)[name = tensor("op_616_cast_fp16")]; tensor value_11_perm_0 = const()[name = tensor("value_11_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_618_to_fp16 = const()[name = tensor("op_618_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_23_cast_fp16 = mul(x = var_604_cast_fp16, y = var_618_to_fp16)[name = tensor("q_h_23_cast_fp16")]; tensor scores_21_transpose_x_0 = const()[name = tensor("scores_21_transpose_x_0"), val = tensor(false)]; tensor scores_21_transpose_y_0 = const()[name = tensor("scores_21_transpose_y_0"), val = tensor(false)]; tensor transpose_74_perm_0 = const()[name = tensor("transpose_74_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_75_perm_0 = const()[name = tensor("transpose_75_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_75 = transpose(perm = transpose_75_perm_0, x = var_613_cast_fp16)[name = tensor("transpose_158")]; tensor transpose_74 = transpose(perm = transpose_74_perm_0, x = q_h_23_cast_fp16)[name = tensor("transpose_159")]; tensor scores_21_cast_fp16 = matmul(transpose_x = scores_21_transpose_x_0, transpose_y = scores_21_transpose_y_0, x = transpose_74, y = transpose_75)[name = tensor("scores_21_cast_fp16")]; tensor scores_23_cast_fp16 = select(a = var_8_to_fp16, b = scores_21_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_23_cast_fp16")]; tensor var_626_cast_fp16 = softmax(axis = var_20, x = scores_23_cast_fp16)[name = tensor("op_626_cast_fp16")]; tensor input_161_cast_fp16 = select(a = var_9_to_fp16, b = var_626_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_161_cast_fp16")]; tensor x_83_transpose_x_0 = const()[name = tensor("x_83_transpose_x_0"), val = tensor(false)]; tensor x_83_transpose_y_0 = const()[name = tensor("x_83_transpose_y_0"), val = tensor(false)]; tensor value_11_cast_fp16 = transpose(perm = value_11_perm_0, x = var_616_cast_fp16)[name = tensor("transpose_157")]; tensor x_83_cast_fp16 = matmul(transpose_x = x_83_transpose_x_0, transpose_y = x_83_transpose_y_0, x = input_161_cast_fp16, y = value_11_cast_fp16)[name = tensor("x_83_cast_fp16")]; tensor var_630_perm_0 = const()[name = tensor("op_630_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_632 = const()[name = tensor("op_632"), val = tensor([1, -1, 512])]; tensor var_630_cast_fp16 = transpose(perm = var_630_perm_0, x = x_83_cast_fp16)[name = tensor("transpose_156")]; tensor input_163_cast_fp16 = reshape(shape = var_632, x = var_630_cast_fp16)[name = tensor("input_163_cast_fp16")]; tensor d_decoders_5_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_5_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18854528))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19116736))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_5_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_5_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19117824)))]; tensor linear_29_cast_fp16 = linear(bias = d_decoders_5_src_attn_linear_out_bias_to_fp16, weight = d_decoders_5_src_attn_linear_out_weight_to_fp16_quantized, x = input_163_cast_fp16)[name = tensor("linear_29_cast_fp16")]; tensor input_167_cast_fp16 = add(x = input_159_cast_fp16, y = linear_29_cast_fp16)[name = tensor("input_167_cast_fp16")]; tensor input_169_axes_0 = const()[name = tensor("input_169_axes_0"), val = tensor([-1])]; tensor d_decoders_6_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_6_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19118912)))]; tensor d_decoders_6_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_6_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19120000)))]; tensor input_169_cast_fp16 = layer_norm(axes = input_169_axes_0, beta = d_decoders_6_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_6_norm1_weight_to_fp16, x = input_167_cast_fp16)[name = tensor("input_169_cast_fp16")]; tensor d_decoders_6_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_6_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19121088))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20169728))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_6_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_6_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20173888)))]; tensor linear_30_cast_fp16 = linear(bias = d_decoders_6_feed_forward_w_1_bias_to_fp16, weight = d_decoders_6_feed_forward_w_1_weight_to_fp16_quantized, x = input_169_cast_fp16)[name = tensor("linear_30_cast_fp16")]; tensor input_173_cast_fp16 = relu(x = linear_30_cast_fp16)[name = tensor("input_173_cast_fp16")]; tensor input_177_axes_0 = const()[name = tensor("input_177_axes_0"), val = tensor([-1])]; tensor d_decoders_6_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_6_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20178048)))]; tensor d_decoders_6_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_6_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20182208)))]; tensor input_177_cast_fp16 = layer_norm(axes = input_177_axes_0, beta = d_decoders_6_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_6_feed_forward_norm_weight_to_fp16, x = input_173_cast_fp16)[name = tensor("input_177_cast_fp16")]; tensor d_decoders_6_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_6_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20186368))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21235008))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_31_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_6_feed_forward_w_2_weight_to_fp16_quantized, x = input_177_cast_fp16)[name = tensor("linear_31_cast_fp16")]; tensor inputs_25_axes_0 = const()[name = tensor("inputs_25_axes_0"), val = tensor([-1])]; tensor d_decoders_6_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_6_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21236096)))]; tensor d_decoders_6_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_6_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21237184)))]; tensor inputs_25_cast_fp16 = layer_norm(axes = inputs_25_axes_0, beta = d_decoders_6_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_6_norm2_weight_to_fp16, x = linear_31_cast_fp16)[name = tensor("inputs_25_cast_fp16")]; tensor inputs_27_cast_fp16 = mul(x = inputs_25_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_27_cast_fp16")]; tensor x_85_perm_0 = const()[name = tensor("x_85_perm_0"), val = tensor([0, 2, 1])]; tensor input_181_pad_0 = const()[name = tensor("input_181_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_181_mode_0 = const()[name = tensor("input_181_mode_0"), val = tensor("constant")]; tensor const_41_to_fp16 = const()[name = tensor("const_41_to_fp16"), val = tensor(0x0p+0)]; tensor x_85_cast_fp16 = transpose(perm = x_85_perm_0, x = inputs_27_cast_fp16)[name = tensor("transpose_155")]; tensor input_181_cast_fp16 = pad(constant_val = const_41_to_fp16, mode = input_181_mode_0, pad = input_181_pad_0, x = x_85_cast_fp16)[name = tensor("input_181_cast_fp16")]; tensor x_87_pad_type_0 = const()[name = tensor("x_87_pad_type_0"), val = tensor("valid")]; tensor x_87_groups_0 = const()[name = tensor("x_87_groups_0"), val = tensor(512)]; tensor x_87_strides_0 = const()[name = tensor("x_87_strides_0"), val = tensor([1])]; tensor x_87_pad_0 = const()[name = tensor("x_87_pad_0"), val = tensor([0, 0])]; tensor x_87_dilations_0 = const()[name = tensor("x_87_dilations_0"), val = tensor([1])]; tensor d_decoders_6_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_6_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21238272))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21243968))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_87_cast_fp16 = conv(dilations = x_87_dilations_0, groups = x_87_groups_0, pad = x_87_pad_0, pad_type = x_87_pad_type_0, strides = x_87_strides_0, weight = d_decoders_6_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_181_cast_fp16)[name = tensor("x_87_cast_fp16")]; tensor x_89_perm_0 = const()[name = tensor("x_89_perm_0"), val = tensor([0, 2, 1])]; tensor x_89_cast_fp16 = transpose(perm = x_89_perm_0, x = x_87_cast_fp16)[name = tensor("transpose_154")]; tensor input_183_cast_fp16 = add(x = x_89_cast_fp16, y = inputs_27_cast_fp16)[name = tensor("input_183_cast_fp16")]; tensor input_185_cast_fp16 = mul(x = input_183_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_185_cast_fp16")]; tensor input_187_cast_fp16 = add(x = input_167_cast_fp16, y = input_185_cast_fp16)[name = tensor("input_187_cast_fp16")]; tensor x_95_axes_0 = const()[name = tensor("x_95_axes_0"), val = tensor([-1])]; tensor d_decoders_6_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_6_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21245056)))]; tensor d_decoders_6_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_6_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21246144)))]; tensor x_95_cast_fp16 = layer_norm(axes = x_95_axes_0, beta = d_decoders_6_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_6_norm3_weight_to_fp16, x = input_187_cast_fp16)[name = tensor("x_95_cast_fp16")]; tensor d_decoders_6_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_6_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21247232))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21509440))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_6_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_6_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21510528)))]; tensor linear_32_cast_fp16 = linear(bias = d_decoders_6_src_attn_linear_q_bias_to_fp16, weight = d_decoders_6_src_attn_linear_q_weight_to_fp16_quantized, x = x_95_cast_fp16)[name = tensor("linear_32_cast_fp16")]; tensor var_698 = const()[name = tensor("op_698"), val = tensor([1, -1, 4, 128])]; tensor var_699_cast_fp16 = reshape(shape = var_698, x = linear_32_cast_fp16)[name = tensor("op_699_cast_fp16")]; tensor d_decoders_6_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_6_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21511616))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22035968))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_6_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_6_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22038080)))]; tensor linear_33_cast_fp16 = linear(bias = d_decoders_6_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_6_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_33_cast_fp16")]; tensor tile_6 = const()[name = tensor("tile_6"), val = tensor([512, 512])]; tensor var_704_axis_0 = const()[name = tensor("op_704_axis_0"), val = tensor(-1)]; tensor var_704_cast_fp16_0, tensor var_704_cast_fp16_1 = split(axis = var_704_axis_0, split_sizes = tile_6, x = linear_33_cast_fp16)[name = tensor("op_704_cast_fp16")]; tensor var_707 = const()[name = tensor("op_707"), val = tensor([1, -1, 4, 128])]; tensor var_708_cast_fp16 = reshape(shape = var_707, x = var_704_cast_fp16_0)[name = tensor("op_708_cast_fp16")]; tensor var_710 = const()[name = tensor("op_710"), val = tensor([1, -1, 4, 128])]; tensor var_711_cast_fp16 = reshape(shape = var_710, x = var_704_cast_fp16_1)[name = tensor("op_711_cast_fp16")]; tensor value_13_perm_0 = const()[name = tensor("value_13_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_713_to_fp16 = const()[name = tensor("op_713_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_27_cast_fp16 = mul(x = var_699_cast_fp16, y = var_713_to_fp16)[name = tensor("q_h_27_cast_fp16")]; tensor scores_25_transpose_x_0 = const()[name = tensor("scores_25_transpose_x_0"), val = tensor(false)]; tensor scores_25_transpose_y_0 = const()[name = tensor("scores_25_transpose_y_0"), val = tensor(false)]; tensor transpose_76_perm_0 = const()[name = tensor("transpose_76_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_77_perm_0 = const()[name = tensor("transpose_77_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_77 = transpose(perm = transpose_77_perm_0, x = var_708_cast_fp16)[name = tensor("transpose_152")]; tensor transpose_76 = transpose(perm = transpose_76_perm_0, x = q_h_27_cast_fp16)[name = tensor("transpose_153")]; tensor scores_25_cast_fp16 = matmul(transpose_x = scores_25_transpose_x_0, transpose_y = scores_25_transpose_y_0, x = transpose_76, y = transpose_77)[name = tensor("scores_25_cast_fp16")]; tensor scores_27_cast_fp16 = select(a = var_8_to_fp16, b = scores_25_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_27_cast_fp16")]; tensor var_721_cast_fp16 = softmax(axis = var_20, x = scores_27_cast_fp16)[name = tensor("op_721_cast_fp16")]; tensor input_189_cast_fp16 = select(a = var_9_to_fp16, b = var_721_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_189_cast_fp16")]; tensor x_97_transpose_x_0 = const()[name = tensor("x_97_transpose_x_0"), val = tensor(false)]; tensor x_97_transpose_y_0 = const()[name = tensor("x_97_transpose_y_0"), val = tensor(false)]; tensor value_13_cast_fp16 = transpose(perm = value_13_perm_0, x = var_711_cast_fp16)[name = tensor("transpose_151")]; tensor x_97_cast_fp16 = matmul(transpose_x = x_97_transpose_x_0, transpose_y = x_97_transpose_y_0, x = input_189_cast_fp16, y = value_13_cast_fp16)[name = tensor("x_97_cast_fp16")]; tensor var_725_perm_0 = const()[name = tensor("op_725_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_727 = const()[name = tensor("op_727"), val = tensor([1, -1, 512])]; tensor var_725_cast_fp16 = transpose(perm = var_725_perm_0, x = x_97_cast_fp16)[name = tensor("transpose_150")]; tensor input_191_cast_fp16 = reshape(shape = var_727, x = var_725_cast_fp16)[name = tensor("input_191_cast_fp16")]; tensor d_decoders_6_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_6_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22040192))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22302400))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_6_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_6_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22303488)))]; tensor linear_34_cast_fp16 = linear(bias = d_decoders_6_src_attn_linear_out_bias_to_fp16, weight = d_decoders_6_src_attn_linear_out_weight_to_fp16_quantized, x = input_191_cast_fp16)[name = tensor("linear_34_cast_fp16")]; tensor input_195_cast_fp16 = add(x = input_187_cast_fp16, y = linear_34_cast_fp16)[name = tensor("input_195_cast_fp16")]; tensor input_197_axes_0 = const()[name = tensor("input_197_axes_0"), val = tensor([-1])]; tensor d_decoders_7_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_7_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22304576)))]; tensor d_decoders_7_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_7_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22305664)))]; tensor input_197_cast_fp16 = layer_norm(axes = input_197_axes_0, beta = d_decoders_7_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_7_norm1_weight_to_fp16, x = input_195_cast_fp16)[name = tensor("input_197_cast_fp16")]; tensor d_decoders_7_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_7_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22306752))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23355392))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_7_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_7_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23359552)))]; tensor linear_35_cast_fp16 = linear(bias = d_decoders_7_feed_forward_w_1_bias_to_fp16, weight = d_decoders_7_feed_forward_w_1_weight_to_fp16_quantized, x = input_197_cast_fp16)[name = tensor("linear_35_cast_fp16")]; tensor input_201_cast_fp16 = relu(x = linear_35_cast_fp16)[name = tensor("input_201_cast_fp16")]; tensor input_205_axes_0 = const()[name = tensor("input_205_axes_0"), val = tensor([-1])]; tensor d_decoders_7_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_7_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23363712)))]; tensor d_decoders_7_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_7_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23367872)))]; tensor input_205_cast_fp16 = layer_norm(axes = input_205_axes_0, beta = d_decoders_7_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_7_feed_forward_norm_weight_to_fp16, x = input_201_cast_fp16)[name = tensor("input_205_cast_fp16")]; tensor d_decoders_7_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_7_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23372032))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24420672))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_36_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_7_feed_forward_w_2_weight_to_fp16_quantized, x = input_205_cast_fp16)[name = tensor("linear_36_cast_fp16")]; tensor inputs_29_axes_0 = const()[name = tensor("inputs_29_axes_0"), val = tensor([-1])]; tensor d_decoders_7_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_7_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24421760)))]; tensor d_decoders_7_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_7_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24422848)))]; tensor inputs_29_cast_fp16 = layer_norm(axes = inputs_29_axes_0, beta = d_decoders_7_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_7_norm2_weight_to_fp16, x = linear_36_cast_fp16)[name = tensor("inputs_29_cast_fp16")]; tensor inputs_31_cast_fp16 = mul(x = inputs_29_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_31_cast_fp16")]; tensor x_99_perm_0 = const()[name = tensor("x_99_perm_0"), val = tensor([0, 2, 1])]; tensor input_209_pad_0 = const()[name = tensor("input_209_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_209_mode_0 = const()[name = tensor("input_209_mode_0"), val = tensor("constant")]; tensor const_47_to_fp16 = const()[name = tensor("const_47_to_fp16"), val = tensor(0x0p+0)]; tensor x_99_cast_fp16 = transpose(perm = x_99_perm_0, x = inputs_31_cast_fp16)[name = tensor("transpose_149")]; tensor input_209_cast_fp16 = pad(constant_val = const_47_to_fp16, mode = input_209_mode_0, pad = input_209_pad_0, x = x_99_cast_fp16)[name = tensor("input_209_cast_fp16")]; tensor x_101_pad_type_0 = const()[name = tensor("x_101_pad_type_0"), val = tensor("valid")]; tensor x_101_groups_0 = const()[name = tensor("x_101_groups_0"), val = tensor(512)]; tensor x_101_strides_0 = const()[name = tensor("x_101_strides_0"), val = tensor([1])]; tensor x_101_pad_0 = const()[name = tensor("x_101_pad_0"), val = tensor([0, 0])]; tensor x_101_dilations_0 = const()[name = tensor("x_101_dilations_0"), val = tensor([1])]; tensor d_decoders_7_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_7_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24423936))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24429632))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_101_cast_fp16 = conv(dilations = x_101_dilations_0, groups = x_101_groups_0, pad = x_101_pad_0, pad_type = x_101_pad_type_0, strides = x_101_strides_0, weight = d_decoders_7_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_209_cast_fp16)[name = tensor("x_101_cast_fp16")]; tensor x_103_perm_0 = const()[name = tensor("x_103_perm_0"), val = tensor([0, 2, 1])]; tensor x_103_cast_fp16 = transpose(perm = x_103_perm_0, x = x_101_cast_fp16)[name = tensor("transpose_148")]; tensor input_211_cast_fp16 = add(x = x_103_cast_fp16, y = inputs_31_cast_fp16)[name = tensor("input_211_cast_fp16")]; tensor input_213_cast_fp16 = mul(x = input_211_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_213_cast_fp16")]; tensor input_215_cast_fp16 = add(x = input_195_cast_fp16, y = input_213_cast_fp16)[name = tensor("input_215_cast_fp16")]; tensor x_109_axes_0 = const()[name = tensor("x_109_axes_0"), val = tensor([-1])]; tensor d_decoders_7_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_7_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24430720)))]; tensor d_decoders_7_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_7_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24431808)))]; tensor x_109_cast_fp16 = layer_norm(axes = x_109_axes_0, beta = d_decoders_7_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_7_norm3_weight_to_fp16, x = input_215_cast_fp16)[name = tensor("x_109_cast_fp16")]; tensor d_decoders_7_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_7_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24432896))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24695104))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_7_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_7_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24696192)))]; tensor linear_37_cast_fp16 = linear(bias = d_decoders_7_src_attn_linear_q_bias_to_fp16, weight = d_decoders_7_src_attn_linear_q_weight_to_fp16_quantized, x = x_109_cast_fp16)[name = tensor("linear_37_cast_fp16")]; tensor var_793 = const()[name = tensor("op_793"), val = tensor([1, -1, 4, 128])]; tensor var_794_cast_fp16 = reshape(shape = var_793, x = linear_37_cast_fp16)[name = tensor("op_794_cast_fp16")]; tensor d_decoders_7_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_7_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24697280))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25221632))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_7_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_7_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25223744)))]; tensor linear_38_cast_fp16 = linear(bias = d_decoders_7_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_7_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_38_cast_fp16")]; tensor tile_7 = const()[name = tensor("tile_7"), val = tensor([512, 512])]; tensor var_799_axis_0 = const()[name = tensor("op_799_axis_0"), val = tensor(-1)]; tensor var_799_cast_fp16_0, tensor var_799_cast_fp16_1 = split(axis = var_799_axis_0, split_sizes = tile_7, x = linear_38_cast_fp16)[name = tensor("op_799_cast_fp16")]; tensor var_802 = const()[name = tensor("op_802"), val = tensor([1, -1, 4, 128])]; tensor var_803_cast_fp16 = reshape(shape = var_802, x = var_799_cast_fp16_0)[name = tensor("op_803_cast_fp16")]; tensor var_805 = const()[name = tensor("op_805"), val = tensor([1, -1, 4, 128])]; tensor var_806_cast_fp16 = reshape(shape = var_805, x = var_799_cast_fp16_1)[name = tensor("op_806_cast_fp16")]; tensor value_15_perm_0 = const()[name = tensor("value_15_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_808_to_fp16 = const()[name = tensor("op_808_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_31_cast_fp16 = mul(x = var_794_cast_fp16, y = var_808_to_fp16)[name = tensor("q_h_31_cast_fp16")]; tensor scores_29_transpose_x_0 = const()[name = tensor("scores_29_transpose_x_0"), val = tensor(false)]; tensor scores_29_transpose_y_0 = const()[name = tensor("scores_29_transpose_y_0"), val = tensor(false)]; tensor transpose_78_perm_0 = const()[name = tensor("transpose_78_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_79_perm_0 = const()[name = tensor("transpose_79_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_79 = transpose(perm = transpose_79_perm_0, x = var_803_cast_fp16)[name = tensor("transpose_146")]; tensor transpose_78 = transpose(perm = transpose_78_perm_0, x = q_h_31_cast_fp16)[name = tensor("transpose_147")]; tensor scores_29_cast_fp16 = matmul(transpose_x = scores_29_transpose_x_0, transpose_y = scores_29_transpose_y_0, x = transpose_78, y = transpose_79)[name = tensor("scores_29_cast_fp16")]; tensor scores_31_cast_fp16 = select(a = var_8_to_fp16, b = scores_29_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_31_cast_fp16")]; tensor var_816_cast_fp16 = softmax(axis = var_20, x = scores_31_cast_fp16)[name = tensor("op_816_cast_fp16")]; tensor input_217_cast_fp16 = select(a = var_9_to_fp16, b = var_816_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_217_cast_fp16")]; tensor x_111_transpose_x_0 = const()[name = tensor("x_111_transpose_x_0"), val = tensor(false)]; tensor x_111_transpose_y_0 = const()[name = tensor("x_111_transpose_y_0"), val = tensor(false)]; tensor value_15_cast_fp16 = transpose(perm = value_15_perm_0, x = var_806_cast_fp16)[name = tensor("transpose_145")]; tensor x_111_cast_fp16 = matmul(transpose_x = x_111_transpose_x_0, transpose_y = x_111_transpose_y_0, x = input_217_cast_fp16, y = value_15_cast_fp16)[name = tensor("x_111_cast_fp16")]; tensor var_820_perm_0 = const()[name = tensor("op_820_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_822 = const()[name = tensor("op_822"), val = tensor([1, -1, 512])]; tensor var_820_cast_fp16 = transpose(perm = var_820_perm_0, x = x_111_cast_fp16)[name = tensor("transpose_144")]; tensor input_219_cast_fp16 = reshape(shape = var_822, x = var_820_cast_fp16)[name = tensor("input_219_cast_fp16")]; tensor d_decoders_7_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_7_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25225856))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25488064))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_7_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_7_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25489152)))]; tensor linear_39_cast_fp16 = linear(bias = d_decoders_7_src_attn_linear_out_bias_to_fp16, weight = d_decoders_7_src_attn_linear_out_weight_to_fp16_quantized, x = input_219_cast_fp16)[name = tensor("linear_39_cast_fp16")]; tensor input_223_cast_fp16 = add(x = input_215_cast_fp16, y = linear_39_cast_fp16)[name = tensor("input_223_cast_fp16")]; tensor input_225_axes_0 = const()[name = tensor("input_225_axes_0"), val = tensor([-1])]; tensor d_decoders_8_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_8_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25490240)))]; tensor d_decoders_8_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_8_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25491328)))]; tensor input_225_cast_fp16 = layer_norm(axes = input_225_axes_0, beta = d_decoders_8_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_8_norm1_weight_to_fp16, x = input_223_cast_fp16)[name = tensor("input_225_cast_fp16")]; tensor d_decoders_8_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_8_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25492416))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26541056))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_8_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_8_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26545216)))]; tensor linear_40_cast_fp16 = linear(bias = d_decoders_8_feed_forward_w_1_bias_to_fp16, weight = d_decoders_8_feed_forward_w_1_weight_to_fp16_quantized, x = input_225_cast_fp16)[name = tensor("linear_40_cast_fp16")]; tensor input_229_cast_fp16 = relu(x = linear_40_cast_fp16)[name = tensor("input_229_cast_fp16")]; tensor input_233_axes_0 = const()[name = tensor("input_233_axes_0"), val = tensor([-1])]; tensor d_decoders_8_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_8_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26549376)))]; tensor d_decoders_8_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_8_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26553536)))]; tensor input_233_cast_fp16 = layer_norm(axes = input_233_axes_0, beta = d_decoders_8_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_8_feed_forward_norm_weight_to_fp16, x = input_229_cast_fp16)[name = tensor("input_233_cast_fp16")]; tensor d_decoders_8_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_8_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26557696))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27606336))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_41_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_8_feed_forward_w_2_weight_to_fp16_quantized, x = input_233_cast_fp16)[name = tensor("linear_41_cast_fp16")]; tensor inputs_33_axes_0 = const()[name = tensor("inputs_33_axes_0"), val = tensor([-1])]; tensor d_decoders_8_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_8_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27607424)))]; tensor d_decoders_8_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_8_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27608512)))]; tensor inputs_33_cast_fp16 = layer_norm(axes = inputs_33_axes_0, beta = d_decoders_8_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_8_norm2_weight_to_fp16, x = linear_41_cast_fp16)[name = tensor("inputs_33_cast_fp16")]; tensor inputs_35_cast_fp16 = mul(x = inputs_33_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_35_cast_fp16")]; tensor x_113_perm_0 = const()[name = tensor("x_113_perm_0"), val = tensor([0, 2, 1])]; tensor input_237_pad_0 = const()[name = tensor("input_237_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_237_mode_0 = const()[name = tensor("input_237_mode_0"), val = tensor("constant")]; tensor const_53_to_fp16 = const()[name = tensor("const_53_to_fp16"), val = tensor(0x0p+0)]; tensor x_113_cast_fp16 = transpose(perm = x_113_perm_0, x = inputs_35_cast_fp16)[name = tensor("transpose_143")]; tensor input_237_cast_fp16 = pad(constant_val = const_53_to_fp16, mode = input_237_mode_0, pad = input_237_pad_0, x = x_113_cast_fp16)[name = tensor("input_237_cast_fp16")]; tensor x_115_pad_type_0 = const()[name = tensor("x_115_pad_type_0"), val = tensor("valid")]; tensor x_115_groups_0 = const()[name = tensor("x_115_groups_0"), val = tensor(512)]; tensor x_115_strides_0 = const()[name = tensor("x_115_strides_0"), val = tensor([1])]; tensor x_115_pad_0 = const()[name = tensor("x_115_pad_0"), val = tensor([0, 0])]; tensor x_115_dilations_0 = const()[name = tensor("x_115_dilations_0"), val = tensor([1])]; tensor d_decoders_8_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_8_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27609600))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27615296))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_115_cast_fp16 = conv(dilations = x_115_dilations_0, groups = x_115_groups_0, pad = x_115_pad_0, pad_type = x_115_pad_type_0, strides = x_115_strides_0, weight = d_decoders_8_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_237_cast_fp16)[name = tensor("x_115_cast_fp16")]; tensor x_117_perm_0 = const()[name = tensor("x_117_perm_0"), val = tensor([0, 2, 1])]; tensor x_117_cast_fp16 = transpose(perm = x_117_perm_0, x = x_115_cast_fp16)[name = tensor("transpose_142")]; tensor input_239_cast_fp16 = add(x = x_117_cast_fp16, y = inputs_35_cast_fp16)[name = tensor("input_239_cast_fp16")]; tensor input_241_cast_fp16 = mul(x = input_239_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_241_cast_fp16")]; tensor input_243_cast_fp16 = add(x = input_223_cast_fp16, y = input_241_cast_fp16)[name = tensor("input_243_cast_fp16")]; tensor x_123_axes_0 = const()[name = tensor("x_123_axes_0"), val = tensor([-1])]; tensor d_decoders_8_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_8_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27616384)))]; tensor d_decoders_8_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_8_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27617472)))]; tensor x_123_cast_fp16 = layer_norm(axes = x_123_axes_0, beta = d_decoders_8_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_8_norm3_weight_to_fp16, x = input_243_cast_fp16)[name = tensor("x_123_cast_fp16")]; tensor d_decoders_8_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_8_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27618560))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27880768))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_8_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_8_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27881856)))]; tensor linear_42_cast_fp16 = linear(bias = d_decoders_8_src_attn_linear_q_bias_to_fp16, weight = d_decoders_8_src_attn_linear_q_weight_to_fp16_quantized, x = x_123_cast_fp16)[name = tensor("linear_42_cast_fp16")]; tensor var_888 = const()[name = tensor("op_888"), val = tensor([1, -1, 4, 128])]; tensor var_889_cast_fp16 = reshape(shape = var_888, x = linear_42_cast_fp16)[name = tensor("op_889_cast_fp16")]; tensor d_decoders_8_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_8_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27882944))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28407296))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_8_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_8_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28409408)))]; tensor linear_43_cast_fp16 = linear(bias = d_decoders_8_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_8_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_43_cast_fp16")]; tensor tile_8 = const()[name = tensor("tile_8"), val = tensor([512, 512])]; tensor var_894_axis_0 = const()[name = tensor("op_894_axis_0"), val = tensor(-1)]; tensor var_894_cast_fp16_0, tensor var_894_cast_fp16_1 = split(axis = var_894_axis_0, split_sizes = tile_8, x = linear_43_cast_fp16)[name = tensor("op_894_cast_fp16")]; tensor var_897 = const()[name = tensor("op_897"), val = tensor([1, -1, 4, 128])]; tensor var_898_cast_fp16 = reshape(shape = var_897, x = var_894_cast_fp16_0)[name = tensor("op_898_cast_fp16")]; tensor var_900 = const()[name = tensor("op_900"), val = tensor([1, -1, 4, 128])]; tensor var_901_cast_fp16 = reshape(shape = var_900, x = var_894_cast_fp16_1)[name = tensor("op_901_cast_fp16")]; tensor value_17_perm_0 = const()[name = tensor("value_17_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_903_to_fp16 = const()[name = tensor("op_903_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_35_cast_fp16 = mul(x = var_889_cast_fp16, y = var_903_to_fp16)[name = tensor("q_h_35_cast_fp16")]; tensor scores_33_transpose_x_0 = const()[name = tensor("scores_33_transpose_x_0"), val = tensor(false)]; tensor scores_33_transpose_y_0 = const()[name = tensor("scores_33_transpose_y_0"), val = tensor(false)]; tensor transpose_80_perm_0 = const()[name = tensor("transpose_80_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_81_perm_0 = const()[name = tensor("transpose_81_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_81 = transpose(perm = transpose_81_perm_0, x = var_898_cast_fp16)[name = tensor("transpose_140")]; tensor transpose_80 = transpose(perm = transpose_80_perm_0, x = q_h_35_cast_fp16)[name = tensor("transpose_141")]; tensor scores_33_cast_fp16 = matmul(transpose_x = scores_33_transpose_x_0, transpose_y = scores_33_transpose_y_0, x = transpose_80, y = transpose_81)[name = tensor("scores_33_cast_fp16")]; tensor scores_35_cast_fp16 = select(a = var_8_to_fp16, b = scores_33_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_35_cast_fp16")]; tensor var_911_cast_fp16 = softmax(axis = var_20, x = scores_35_cast_fp16)[name = tensor("op_911_cast_fp16")]; tensor input_245_cast_fp16 = select(a = var_9_to_fp16, b = var_911_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_245_cast_fp16")]; tensor x_125_transpose_x_0 = const()[name = tensor("x_125_transpose_x_0"), val = tensor(false)]; tensor x_125_transpose_y_0 = const()[name = tensor("x_125_transpose_y_0"), val = tensor(false)]; tensor value_17_cast_fp16 = transpose(perm = value_17_perm_0, x = var_901_cast_fp16)[name = tensor("transpose_139")]; tensor x_125_cast_fp16 = matmul(transpose_x = x_125_transpose_x_0, transpose_y = x_125_transpose_y_0, x = input_245_cast_fp16, y = value_17_cast_fp16)[name = tensor("x_125_cast_fp16")]; tensor var_915_perm_0 = const()[name = tensor("op_915_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_917 = const()[name = tensor("op_917"), val = tensor([1, -1, 512])]; tensor var_915_cast_fp16 = transpose(perm = var_915_perm_0, x = x_125_cast_fp16)[name = tensor("transpose_138")]; tensor input_247_cast_fp16 = reshape(shape = var_917, x = var_915_cast_fp16)[name = tensor("input_247_cast_fp16")]; tensor d_decoders_8_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_8_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28411520))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28673728))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_8_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_8_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28674816)))]; tensor linear_44_cast_fp16 = linear(bias = d_decoders_8_src_attn_linear_out_bias_to_fp16, weight = d_decoders_8_src_attn_linear_out_weight_to_fp16_quantized, x = input_247_cast_fp16)[name = tensor("linear_44_cast_fp16")]; tensor input_251_cast_fp16 = add(x = input_243_cast_fp16, y = linear_44_cast_fp16)[name = tensor("input_251_cast_fp16")]; tensor input_253_axes_0 = const()[name = tensor("input_253_axes_0"), val = tensor([-1])]; tensor d_decoders_9_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_9_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28675904)))]; tensor d_decoders_9_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_9_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28676992)))]; tensor input_253_cast_fp16 = layer_norm(axes = input_253_axes_0, beta = d_decoders_9_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_9_norm1_weight_to_fp16, x = input_251_cast_fp16)[name = tensor("input_253_cast_fp16")]; tensor d_decoders_9_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_9_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28678080))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29726720))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_9_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_9_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29730880)))]; tensor linear_45_cast_fp16 = linear(bias = d_decoders_9_feed_forward_w_1_bias_to_fp16, weight = d_decoders_9_feed_forward_w_1_weight_to_fp16_quantized, x = input_253_cast_fp16)[name = tensor("linear_45_cast_fp16")]; tensor input_257_cast_fp16 = relu(x = linear_45_cast_fp16)[name = tensor("input_257_cast_fp16")]; tensor input_261_axes_0 = const()[name = tensor("input_261_axes_0"), val = tensor([-1])]; tensor d_decoders_9_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_9_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29735040)))]; tensor d_decoders_9_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_9_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29739200)))]; tensor input_261_cast_fp16 = layer_norm(axes = input_261_axes_0, beta = d_decoders_9_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_9_feed_forward_norm_weight_to_fp16, x = input_257_cast_fp16)[name = tensor("input_261_cast_fp16")]; tensor d_decoders_9_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_9_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29743360))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30792000))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_46_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_9_feed_forward_w_2_weight_to_fp16_quantized, x = input_261_cast_fp16)[name = tensor("linear_46_cast_fp16")]; tensor inputs_37_axes_0 = const()[name = tensor("inputs_37_axes_0"), val = tensor([-1])]; tensor d_decoders_9_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_9_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30793088)))]; tensor d_decoders_9_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_9_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30794176)))]; tensor inputs_37_cast_fp16 = layer_norm(axes = inputs_37_axes_0, beta = d_decoders_9_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_9_norm2_weight_to_fp16, x = linear_46_cast_fp16)[name = tensor("inputs_37_cast_fp16")]; tensor inputs_39_cast_fp16 = mul(x = inputs_37_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_39_cast_fp16")]; tensor x_127_perm_0 = const()[name = tensor("x_127_perm_0"), val = tensor([0, 2, 1])]; tensor input_265_pad_0 = const()[name = tensor("input_265_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_265_mode_0 = const()[name = tensor("input_265_mode_0"), val = tensor("constant")]; tensor const_59_to_fp16 = const()[name = tensor("const_59_to_fp16"), val = tensor(0x0p+0)]; tensor x_127_cast_fp16 = transpose(perm = x_127_perm_0, x = inputs_39_cast_fp16)[name = tensor("transpose_137")]; tensor input_265_cast_fp16 = pad(constant_val = const_59_to_fp16, mode = input_265_mode_0, pad = input_265_pad_0, x = x_127_cast_fp16)[name = tensor("input_265_cast_fp16")]; tensor x_129_pad_type_0 = const()[name = tensor("x_129_pad_type_0"), val = tensor("valid")]; tensor x_129_groups_0 = const()[name = tensor("x_129_groups_0"), val = tensor(512)]; tensor x_129_strides_0 = const()[name = tensor("x_129_strides_0"), val = tensor([1])]; tensor x_129_pad_0 = const()[name = tensor("x_129_pad_0"), val = tensor([0, 0])]; tensor x_129_dilations_0 = const()[name = tensor("x_129_dilations_0"), val = tensor([1])]; tensor d_decoders_9_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_9_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30795264))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30800960))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_129_cast_fp16 = conv(dilations = x_129_dilations_0, groups = x_129_groups_0, pad = x_129_pad_0, pad_type = x_129_pad_type_0, strides = x_129_strides_0, weight = d_decoders_9_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_265_cast_fp16)[name = tensor("x_129_cast_fp16")]; tensor x_131_perm_0 = const()[name = tensor("x_131_perm_0"), val = tensor([0, 2, 1])]; tensor x_131_cast_fp16 = transpose(perm = x_131_perm_0, x = x_129_cast_fp16)[name = tensor("transpose_136")]; tensor input_267_cast_fp16 = add(x = x_131_cast_fp16, y = inputs_39_cast_fp16)[name = tensor("input_267_cast_fp16")]; tensor input_269_cast_fp16 = mul(x = input_267_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_269_cast_fp16")]; tensor input_271_cast_fp16 = add(x = input_251_cast_fp16, y = input_269_cast_fp16)[name = tensor("input_271_cast_fp16")]; tensor x_137_axes_0 = const()[name = tensor("x_137_axes_0"), val = tensor([-1])]; tensor d_decoders_9_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_9_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30802048)))]; tensor d_decoders_9_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_9_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30803136)))]; tensor x_137_cast_fp16 = layer_norm(axes = x_137_axes_0, beta = d_decoders_9_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_9_norm3_weight_to_fp16, x = input_271_cast_fp16)[name = tensor("x_137_cast_fp16")]; tensor d_decoders_9_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_9_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30804224))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31066432))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_9_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_9_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31067520)))]; tensor linear_47_cast_fp16 = linear(bias = d_decoders_9_src_attn_linear_q_bias_to_fp16, weight = d_decoders_9_src_attn_linear_q_weight_to_fp16_quantized, x = x_137_cast_fp16)[name = tensor("linear_47_cast_fp16")]; tensor var_983 = const()[name = tensor("op_983"), val = tensor([1, -1, 4, 128])]; tensor var_984_cast_fp16 = reshape(shape = var_983, x = linear_47_cast_fp16)[name = tensor("op_984_cast_fp16")]; tensor d_decoders_9_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_9_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31068608))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31592960))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_9_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_9_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31595072)))]; tensor linear_48_cast_fp16 = linear(bias = d_decoders_9_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_9_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_48_cast_fp16")]; tensor tile_9 = const()[name = tensor("tile_9"), val = tensor([512, 512])]; tensor var_989_axis_0 = const()[name = tensor("op_989_axis_0"), val = tensor(-1)]; tensor var_989_cast_fp16_0, tensor var_989_cast_fp16_1 = split(axis = var_989_axis_0, split_sizes = tile_9, x = linear_48_cast_fp16)[name = tensor("op_989_cast_fp16")]; tensor var_992 = const()[name = tensor("op_992"), val = tensor([1, -1, 4, 128])]; tensor var_993_cast_fp16 = reshape(shape = var_992, x = var_989_cast_fp16_0)[name = tensor("op_993_cast_fp16")]; tensor var_995 = const()[name = tensor("op_995"), val = tensor([1, -1, 4, 128])]; tensor var_996_cast_fp16 = reshape(shape = var_995, x = var_989_cast_fp16_1)[name = tensor("op_996_cast_fp16")]; tensor value_19_perm_0 = const()[name = tensor("value_19_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_998_to_fp16 = const()[name = tensor("op_998_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_39_cast_fp16 = mul(x = var_984_cast_fp16, y = var_998_to_fp16)[name = tensor("q_h_39_cast_fp16")]; tensor scores_37_transpose_x_0 = const()[name = tensor("scores_37_transpose_x_0"), val = tensor(false)]; tensor scores_37_transpose_y_0 = const()[name = tensor("scores_37_transpose_y_0"), val = tensor(false)]; tensor transpose_82_perm_0 = const()[name = tensor("transpose_82_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_83_perm_0 = const()[name = tensor("transpose_83_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_83 = transpose(perm = transpose_83_perm_0, x = var_993_cast_fp16)[name = tensor("transpose_134")]; tensor transpose_82 = transpose(perm = transpose_82_perm_0, x = q_h_39_cast_fp16)[name = tensor("transpose_135")]; tensor scores_37_cast_fp16 = matmul(transpose_x = scores_37_transpose_x_0, transpose_y = scores_37_transpose_y_0, x = transpose_82, y = transpose_83)[name = tensor("scores_37_cast_fp16")]; tensor scores_39_cast_fp16 = select(a = var_8_to_fp16, b = scores_37_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_39_cast_fp16")]; tensor var_1006_cast_fp16 = softmax(axis = var_20, x = scores_39_cast_fp16)[name = tensor("op_1006_cast_fp16")]; tensor input_273_cast_fp16 = select(a = var_9_to_fp16, b = var_1006_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_273_cast_fp16")]; tensor x_139_transpose_x_0 = const()[name = tensor("x_139_transpose_x_0"), val = tensor(false)]; tensor x_139_transpose_y_0 = const()[name = tensor("x_139_transpose_y_0"), val = tensor(false)]; tensor value_19_cast_fp16 = transpose(perm = value_19_perm_0, x = var_996_cast_fp16)[name = tensor("transpose_133")]; tensor x_139_cast_fp16 = matmul(transpose_x = x_139_transpose_x_0, transpose_y = x_139_transpose_y_0, x = input_273_cast_fp16, y = value_19_cast_fp16)[name = tensor("x_139_cast_fp16")]; tensor var_1010_perm_0 = const()[name = tensor("op_1010_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1012 = const()[name = tensor("op_1012"), val = tensor([1, -1, 512])]; tensor var_1010_cast_fp16 = transpose(perm = var_1010_perm_0, x = x_139_cast_fp16)[name = tensor("transpose_132")]; tensor input_275_cast_fp16 = reshape(shape = var_1012, x = var_1010_cast_fp16)[name = tensor("input_275_cast_fp16")]; tensor d_decoders_9_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_9_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31597184))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31859392))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_9_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_9_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31860480)))]; tensor linear_49_cast_fp16 = linear(bias = d_decoders_9_src_attn_linear_out_bias_to_fp16, weight = d_decoders_9_src_attn_linear_out_weight_to_fp16_quantized, x = input_275_cast_fp16)[name = tensor("linear_49_cast_fp16")]; tensor input_279_cast_fp16 = add(x = input_271_cast_fp16, y = linear_49_cast_fp16)[name = tensor("input_279_cast_fp16")]; tensor input_281_axes_0 = const()[name = tensor("input_281_axes_0"), val = tensor([-1])]; tensor d_decoders_10_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_10_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31861568)))]; tensor d_decoders_10_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_10_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31862656)))]; tensor input_281_cast_fp16 = layer_norm(axes = input_281_axes_0, beta = d_decoders_10_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_10_norm1_weight_to_fp16, x = input_279_cast_fp16)[name = tensor("input_281_cast_fp16")]; tensor d_decoders_10_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_10_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31863744))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(32912384))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_10_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_10_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(32916544)))]; tensor linear_50_cast_fp16 = linear(bias = d_decoders_10_feed_forward_w_1_bias_to_fp16, weight = d_decoders_10_feed_forward_w_1_weight_to_fp16_quantized, x = input_281_cast_fp16)[name = tensor("linear_50_cast_fp16")]; tensor input_285_cast_fp16 = relu(x = linear_50_cast_fp16)[name = tensor("input_285_cast_fp16")]; tensor input_289_axes_0 = const()[name = tensor("input_289_axes_0"), val = tensor([-1])]; tensor d_decoders_10_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_10_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(32920704)))]; tensor d_decoders_10_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_10_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(32924864)))]; tensor input_289_cast_fp16 = layer_norm(axes = input_289_axes_0, beta = d_decoders_10_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_10_feed_forward_norm_weight_to_fp16, x = input_285_cast_fp16)[name = tensor("input_289_cast_fp16")]; tensor d_decoders_10_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_10_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(32929024))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33977664))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_51_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_10_feed_forward_w_2_weight_to_fp16_quantized, x = input_289_cast_fp16)[name = tensor("linear_51_cast_fp16")]; tensor inputs_41_axes_0 = const()[name = tensor("inputs_41_axes_0"), val = tensor([-1])]; tensor d_decoders_10_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_10_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33978752)))]; tensor d_decoders_10_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_10_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33979840)))]; tensor inputs_41_cast_fp16 = layer_norm(axes = inputs_41_axes_0, beta = d_decoders_10_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_10_norm2_weight_to_fp16, x = linear_51_cast_fp16)[name = tensor("inputs_41_cast_fp16")]; tensor inputs_43_cast_fp16 = mul(x = inputs_41_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_43_cast_fp16")]; tensor x_141_perm_0 = const()[name = tensor("x_141_perm_0"), val = tensor([0, 2, 1])]; tensor input_293_pad_0 = const()[name = tensor("input_293_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_293_mode_0 = const()[name = tensor("input_293_mode_0"), val = tensor("constant")]; tensor const_65_to_fp16 = const()[name = tensor("const_65_to_fp16"), val = tensor(0x0p+0)]; tensor x_141_cast_fp16 = transpose(perm = x_141_perm_0, x = inputs_43_cast_fp16)[name = tensor("transpose_131")]; tensor input_293_cast_fp16 = pad(constant_val = const_65_to_fp16, mode = input_293_mode_0, pad = input_293_pad_0, x = x_141_cast_fp16)[name = tensor("input_293_cast_fp16")]; tensor x_143_pad_type_0 = const()[name = tensor("x_143_pad_type_0"), val = tensor("valid")]; tensor x_143_groups_0 = const()[name = tensor("x_143_groups_0"), val = tensor(512)]; tensor x_143_strides_0 = const()[name = tensor("x_143_strides_0"), val = tensor([1])]; tensor x_143_pad_0 = const()[name = tensor("x_143_pad_0"), val = tensor([0, 0])]; tensor x_143_dilations_0 = const()[name = tensor("x_143_dilations_0"), val = tensor([1])]; tensor d_decoders_10_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_10_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33980928))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33986624))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_143_cast_fp16 = conv(dilations = x_143_dilations_0, groups = x_143_groups_0, pad = x_143_pad_0, pad_type = x_143_pad_type_0, strides = x_143_strides_0, weight = d_decoders_10_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_293_cast_fp16)[name = tensor("x_143_cast_fp16")]; tensor x_145_perm_0 = const()[name = tensor("x_145_perm_0"), val = tensor([0, 2, 1])]; tensor x_145_cast_fp16 = transpose(perm = x_145_perm_0, x = x_143_cast_fp16)[name = tensor("transpose_130")]; tensor input_295_cast_fp16 = add(x = x_145_cast_fp16, y = inputs_43_cast_fp16)[name = tensor("input_295_cast_fp16")]; tensor input_297_cast_fp16 = mul(x = input_295_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_297_cast_fp16")]; tensor input_299_cast_fp16 = add(x = input_279_cast_fp16, y = input_297_cast_fp16)[name = tensor("input_299_cast_fp16")]; tensor x_151_axes_0 = const()[name = tensor("x_151_axes_0"), val = tensor([-1])]; tensor d_decoders_10_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_10_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33987712)))]; tensor d_decoders_10_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_10_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33988800)))]; tensor x_151_cast_fp16 = layer_norm(axes = x_151_axes_0, beta = d_decoders_10_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_10_norm3_weight_to_fp16, x = input_299_cast_fp16)[name = tensor("x_151_cast_fp16")]; tensor d_decoders_10_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_10_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33989888))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34252096))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_10_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_10_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34253184)))]; tensor linear_52_cast_fp16 = linear(bias = d_decoders_10_src_attn_linear_q_bias_to_fp16, weight = d_decoders_10_src_attn_linear_q_weight_to_fp16_quantized, x = x_151_cast_fp16)[name = tensor("linear_52_cast_fp16")]; tensor var_1078 = const()[name = tensor("op_1078"), val = tensor([1, -1, 4, 128])]; tensor var_1079_cast_fp16 = reshape(shape = var_1078, x = linear_52_cast_fp16)[name = tensor("op_1079_cast_fp16")]; tensor d_decoders_10_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_10_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34254272))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34778624))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_10_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_10_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34780736)))]; tensor linear_53_cast_fp16 = linear(bias = d_decoders_10_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_10_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_53_cast_fp16")]; tensor tile_10 = const()[name = tensor("tile_10"), val = tensor([512, 512])]; tensor var_1084_axis_0 = const()[name = tensor("op_1084_axis_0"), val = tensor(-1)]; tensor var_1084_cast_fp16_0, tensor var_1084_cast_fp16_1 = split(axis = var_1084_axis_0, split_sizes = tile_10, x = linear_53_cast_fp16)[name = tensor("op_1084_cast_fp16")]; tensor var_1087 = const()[name = tensor("op_1087"), val = tensor([1, -1, 4, 128])]; tensor var_1088_cast_fp16 = reshape(shape = var_1087, x = var_1084_cast_fp16_0)[name = tensor("op_1088_cast_fp16")]; tensor var_1090 = const()[name = tensor("op_1090"), val = tensor([1, -1, 4, 128])]; tensor var_1091_cast_fp16 = reshape(shape = var_1090, x = var_1084_cast_fp16_1)[name = tensor("op_1091_cast_fp16")]; tensor value_21_perm_0 = const()[name = tensor("value_21_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1093_to_fp16 = const()[name = tensor("op_1093_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_43_cast_fp16 = mul(x = var_1079_cast_fp16, y = var_1093_to_fp16)[name = tensor("q_h_43_cast_fp16")]; tensor scores_41_transpose_x_0 = const()[name = tensor("scores_41_transpose_x_0"), val = tensor(false)]; tensor scores_41_transpose_y_0 = const()[name = tensor("scores_41_transpose_y_0"), val = tensor(false)]; tensor transpose_84_perm_0 = const()[name = tensor("transpose_84_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_85_perm_0 = const()[name = tensor("transpose_85_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_85 = transpose(perm = transpose_85_perm_0, x = var_1088_cast_fp16)[name = tensor("transpose_128")]; tensor transpose_84 = transpose(perm = transpose_84_perm_0, x = q_h_43_cast_fp16)[name = tensor("transpose_129")]; tensor scores_41_cast_fp16 = matmul(transpose_x = scores_41_transpose_x_0, transpose_y = scores_41_transpose_y_0, x = transpose_84, y = transpose_85)[name = tensor("scores_41_cast_fp16")]; tensor scores_43_cast_fp16 = select(a = var_8_to_fp16, b = scores_41_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_43_cast_fp16")]; tensor var_1101_cast_fp16 = softmax(axis = var_20, x = scores_43_cast_fp16)[name = tensor("op_1101_cast_fp16")]; tensor input_301_cast_fp16 = select(a = var_9_to_fp16, b = var_1101_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_301_cast_fp16")]; tensor x_153_transpose_x_0 = const()[name = tensor("x_153_transpose_x_0"), val = tensor(false)]; tensor x_153_transpose_y_0 = const()[name = tensor("x_153_transpose_y_0"), val = tensor(false)]; tensor value_21_cast_fp16 = transpose(perm = value_21_perm_0, x = var_1091_cast_fp16)[name = tensor("transpose_127")]; tensor x_153_cast_fp16 = matmul(transpose_x = x_153_transpose_x_0, transpose_y = x_153_transpose_y_0, x = input_301_cast_fp16, y = value_21_cast_fp16)[name = tensor("x_153_cast_fp16")]; tensor var_1105_perm_0 = const()[name = tensor("op_1105_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1107 = const()[name = tensor("op_1107"), val = tensor([1, -1, 512])]; tensor var_1105_cast_fp16 = transpose(perm = var_1105_perm_0, x = x_153_cast_fp16)[name = tensor("transpose_126")]; tensor input_303_cast_fp16 = reshape(shape = var_1107, x = var_1105_cast_fp16)[name = tensor("input_303_cast_fp16")]; tensor d_decoders_10_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_10_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34782848))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35045056))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_10_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_10_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35046144)))]; tensor linear_54_cast_fp16 = linear(bias = d_decoders_10_src_attn_linear_out_bias_to_fp16, weight = d_decoders_10_src_attn_linear_out_weight_to_fp16_quantized, x = input_303_cast_fp16)[name = tensor("linear_54_cast_fp16")]; tensor input_307_cast_fp16 = add(x = input_299_cast_fp16, y = linear_54_cast_fp16)[name = tensor("input_307_cast_fp16")]; tensor input_309_axes_0 = const()[name = tensor("input_309_axes_0"), val = tensor([-1])]; tensor d_decoders_11_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_11_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35047232)))]; tensor d_decoders_11_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_11_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35048320)))]; tensor input_309_cast_fp16 = layer_norm(axes = input_309_axes_0, beta = d_decoders_11_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_11_norm1_weight_to_fp16, x = input_307_cast_fp16)[name = tensor("input_309_cast_fp16")]; tensor d_decoders_11_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_11_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35049408))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36098048))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_11_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_11_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36102208)))]; tensor linear_55_cast_fp16 = linear(bias = d_decoders_11_feed_forward_w_1_bias_to_fp16, weight = d_decoders_11_feed_forward_w_1_weight_to_fp16_quantized, x = input_309_cast_fp16)[name = tensor("linear_55_cast_fp16")]; tensor input_313_cast_fp16 = relu(x = linear_55_cast_fp16)[name = tensor("input_313_cast_fp16")]; tensor input_317_axes_0 = const()[name = tensor("input_317_axes_0"), val = tensor([-1])]; tensor d_decoders_11_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_11_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36106368)))]; tensor d_decoders_11_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_11_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36110528)))]; tensor input_317_cast_fp16 = layer_norm(axes = input_317_axes_0, beta = d_decoders_11_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_11_feed_forward_norm_weight_to_fp16, x = input_313_cast_fp16)[name = tensor("input_317_cast_fp16")]; tensor d_decoders_11_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_11_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36114688))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37163328))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_56_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_11_feed_forward_w_2_weight_to_fp16_quantized, x = input_317_cast_fp16)[name = tensor("linear_56_cast_fp16")]; tensor inputs_45_axes_0 = const()[name = tensor("inputs_45_axes_0"), val = tensor([-1])]; tensor d_decoders_11_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_11_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37164416)))]; tensor d_decoders_11_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_11_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37165504)))]; tensor inputs_45_cast_fp16 = layer_norm(axes = inputs_45_axes_0, beta = d_decoders_11_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_11_norm2_weight_to_fp16, x = linear_56_cast_fp16)[name = tensor("inputs_45_cast_fp16")]; tensor inputs_47_cast_fp16 = mul(x = inputs_45_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_47_cast_fp16")]; tensor x_155_perm_0 = const()[name = tensor("x_155_perm_0"), val = tensor([0, 2, 1])]; tensor input_321_pad_0 = const()[name = tensor("input_321_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_321_mode_0 = const()[name = tensor("input_321_mode_0"), val = tensor("constant")]; tensor const_71_to_fp16 = const()[name = tensor("const_71_to_fp16"), val = tensor(0x0p+0)]; tensor x_155_cast_fp16 = transpose(perm = x_155_perm_0, x = inputs_47_cast_fp16)[name = tensor("transpose_125")]; tensor input_321_cast_fp16 = pad(constant_val = const_71_to_fp16, mode = input_321_mode_0, pad = input_321_pad_0, x = x_155_cast_fp16)[name = tensor("input_321_cast_fp16")]; tensor x_157_pad_type_0 = const()[name = tensor("x_157_pad_type_0"), val = tensor("valid")]; tensor x_157_groups_0 = const()[name = tensor("x_157_groups_0"), val = tensor(512)]; tensor x_157_strides_0 = const()[name = tensor("x_157_strides_0"), val = tensor([1])]; tensor x_157_pad_0 = const()[name = tensor("x_157_pad_0"), val = tensor([0, 0])]; tensor x_157_dilations_0 = const()[name = tensor("x_157_dilations_0"), val = tensor([1])]; tensor d_decoders_11_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_11_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37166592))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37172288))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_157_cast_fp16 = conv(dilations = x_157_dilations_0, groups = x_157_groups_0, pad = x_157_pad_0, pad_type = x_157_pad_type_0, strides = x_157_strides_0, weight = d_decoders_11_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_321_cast_fp16)[name = tensor("x_157_cast_fp16")]; tensor x_159_perm_0 = const()[name = tensor("x_159_perm_0"), val = tensor([0, 2, 1])]; tensor x_159_cast_fp16 = transpose(perm = x_159_perm_0, x = x_157_cast_fp16)[name = tensor("transpose_124")]; tensor input_323_cast_fp16 = add(x = x_159_cast_fp16, y = inputs_47_cast_fp16)[name = tensor("input_323_cast_fp16")]; tensor input_325_cast_fp16 = mul(x = input_323_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_325_cast_fp16")]; tensor input_327_cast_fp16 = add(x = input_307_cast_fp16, y = input_325_cast_fp16)[name = tensor("input_327_cast_fp16")]; tensor x_165_axes_0 = const()[name = tensor("x_165_axes_0"), val = tensor([-1])]; tensor d_decoders_11_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_11_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37173376)))]; tensor d_decoders_11_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_11_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37174464)))]; tensor x_165_cast_fp16 = layer_norm(axes = x_165_axes_0, beta = d_decoders_11_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_11_norm3_weight_to_fp16, x = input_327_cast_fp16)[name = tensor("x_165_cast_fp16")]; tensor d_decoders_11_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_11_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37175552))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37437760))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_11_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_11_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37438848)))]; tensor linear_57_cast_fp16 = linear(bias = d_decoders_11_src_attn_linear_q_bias_to_fp16, weight = d_decoders_11_src_attn_linear_q_weight_to_fp16_quantized, x = x_165_cast_fp16)[name = tensor("linear_57_cast_fp16")]; tensor var_1173 = const()[name = tensor("op_1173"), val = tensor([1, -1, 4, 128])]; tensor var_1174_cast_fp16 = reshape(shape = var_1173, x = linear_57_cast_fp16)[name = tensor("op_1174_cast_fp16")]; tensor d_decoders_11_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_11_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37439936))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37964288))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_11_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_11_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37966400)))]; tensor linear_58_cast_fp16 = linear(bias = d_decoders_11_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_11_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_58_cast_fp16")]; tensor tile_11 = const()[name = tensor("tile_11"), val = tensor([512, 512])]; tensor var_1179_axis_0 = const()[name = tensor("op_1179_axis_0"), val = tensor(-1)]; tensor var_1179_cast_fp16_0, tensor var_1179_cast_fp16_1 = split(axis = var_1179_axis_0, split_sizes = tile_11, x = linear_58_cast_fp16)[name = tensor("op_1179_cast_fp16")]; tensor var_1182 = const()[name = tensor("op_1182"), val = tensor([1, -1, 4, 128])]; tensor var_1183_cast_fp16 = reshape(shape = var_1182, x = var_1179_cast_fp16_0)[name = tensor("op_1183_cast_fp16")]; tensor var_1185 = const()[name = tensor("op_1185"), val = tensor([1, -1, 4, 128])]; tensor var_1186_cast_fp16 = reshape(shape = var_1185, x = var_1179_cast_fp16_1)[name = tensor("op_1186_cast_fp16")]; tensor value_23_perm_0 = const()[name = tensor("value_23_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1188_to_fp16 = const()[name = tensor("op_1188_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_47_cast_fp16 = mul(x = var_1174_cast_fp16, y = var_1188_to_fp16)[name = tensor("q_h_47_cast_fp16")]; tensor scores_45_transpose_x_0 = const()[name = tensor("scores_45_transpose_x_0"), val = tensor(false)]; tensor scores_45_transpose_y_0 = const()[name = tensor("scores_45_transpose_y_0"), val = tensor(false)]; tensor transpose_86_perm_0 = const()[name = tensor("transpose_86_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_87_perm_0 = const()[name = tensor("transpose_87_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_87 = transpose(perm = transpose_87_perm_0, x = var_1183_cast_fp16)[name = tensor("transpose_122")]; tensor transpose_86 = transpose(perm = transpose_86_perm_0, x = q_h_47_cast_fp16)[name = tensor("transpose_123")]; tensor scores_45_cast_fp16 = matmul(transpose_x = scores_45_transpose_x_0, transpose_y = scores_45_transpose_y_0, x = transpose_86, y = transpose_87)[name = tensor("scores_45_cast_fp16")]; tensor scores_47_cast_fp16 = select(a = var_8_to_fp16, b = scores_45_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_47_cast_fp16")]; tensor var_1196_cast_fp16 = softmax(axis = var_20, x = scores_47_cast_fp16)[name = tensor("op_1196_cast_fp16")]; tensor input_329_cast_fp16 = select(a = var_9_to_fp16, b = var_1196_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_329_cast_fp16")]; tensor x_167_transpose_x_0 = const()[name = tensor("x_167_transpose_x_0"), val = tensor(false)]; tensor x_167_transpose_y_0 = const()[name = tensor("x_167_transpose_y_0"), val = tensor(false)]; tensor value_23_cast_fp16 = transpose(perm = value_23_perm_0, x = var_1186_cast_fp16)[name = tensor("transpose_121")]; tensor x_167_cast_fp16 = matmul(transpose_x = x_167_transpose_x_0, transpose_y = x_167_transpose_y_0, x = input_329_cast_fp16, y = value_23_cast_fp16)[name = tensor("x_167_cast_fp16")]; tensor var_1200_perm_0 = const()[name = tensor("op_1200_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1202 = const()[name = tensor("op_1202"), val = tensor([1, -1, 512])]; tensor var_1200_cast_fp16 = transpose(perm = var_1200_perm_0, x = x_167_cast_fp16)[name = tensor("transpose_120")]; tensor input_331_cast_fp16 = reshape(shape = var_1202, x = var_1200_cast_fp16)[name = tensor("input_331_cast_fp16")]; tensor d_decoders_11_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_11_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37968512))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38230720))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_11_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_11_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38231808)))]; tensor linear_59_cast_fp16 = linear(bias = d_decoders_11_src_attn_linear_out_bias_to_fp16, weight = d_decoders_11_src_attn_linear_out_weight_to_fp16_quantized, x = input_331_cast_fp16)[name = tensor("linear_59_cast_fp16")]; tensor input_335_cast_fp16 = add(x = input_327_cast_fp16, y = linear_59_cast_fp16)[name = tensor("input_335_cast_fp16")]; tensor input_337_axes_0 = const()[name = tensor("input_337_axes_0"), val = tensor([-1])]; tensor d_decoders_12_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_12_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38232896)))]; tensor d_decoders_12_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_12_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38233984)))]; tensor input_337_cast_fp16 = layer_norm(axes = input_337_axes_0, beta = d_decoders_12_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_12_norm1_weight_to_fp16, x = input_335_cast_fp16)[name = tensor("input_337_cast_fp16")]; tensor d_decoders_12_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_12_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38235072))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39283712))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_12_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_12_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39287872)))]; tensor linear_60_cast_fp16 = linear(bias = d_decoders_12_feed_forward_w_1_bias_to_fp16, weight = d_decoders_12_feed_forward_w_1_weight_to_fp16_quantized, x = input_337_cast_fp16)[name = tensor("linear_60_cast_fp16")]; tensor input_341_cast_fp16 = relu(x = linear_60_cast_fp16)[name = tensor("input_341_cast_fp16")]; tensor input_345_axes_0 = const()[name = tensor("input_345_axes_0"), val = tensor([-1])]; tensor d_decoders_12_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_12_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39292032)))]; tensor d_decoders_12_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_12_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39296192)))]; tensor input_345_cast_fp16 = layer_norm(axes = input_345_axes_0, beta = d_decoders_12_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_12_feed_forward_norm_weight_to_fp16, x = input_341_cast_fp16)[name = tensor("input_345_cast_fp16")]; tensor d_decoders_12_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_12_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39300352))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40348992))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_61_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_12_feed_forward_w_2_weight_to_fp16_quantized, x = input_345_cast_fp16)[name = tensor("linear_61_cast_fp16")]; tensor inputs_49_axes_0 = const()[name = tensor("inputs_49_axes_0"), val = tensor([-1])]; tensor d_decoders_12_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_12_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40350080)))]; tensor d_decoders_12_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_12_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40351168)))]; tensor inputs_49_cast_fp16 = layer_norm(axes = inputs_49_axes_0, beta = d_decoders_12_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_12_norm2_weight_to_fp16, x = linear_61_cast_fp16)[name = tensor("inputs_49_cast_fp16")]; tensor inputs_51_cast_fp16 = mul(x = inputs_49_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_51_cast_fp16")]; tensor x_169_perm_0 = const()[name = tensor("x_169_perm_0"), val = tensor([0, 2, 1])]; tensor input_349_pad_0 = const()[name = tensor("input_349_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_349_mode_0 = const()[name = tensor("input_349_mode_0"), val = tensor("constant")]; tensor const_77_to_fp16 = const()[name = tensor("const_77_to_fp16"), val = tensor(0x0p+0)]; tensor x_169_cast_fp16 = transpose(perm = x_169_perm_0, x = inputs_51_cast_fp16)[name = tensor("transpose_119")]; tensor input_349_cast_fp16 = pad(constant_val = const_77_to_fp16, mode = input_349_mode_0, pad = input_349_pad_0, x = x_169_cast_fp16)[name = tensor("input_349_cast_fp16")]; tensor x_171_pad_type_0 = const()[name = tensor("x_171_pad_type_0"), val = tensor("valid")]; tensor x_171_groups_0 = const()[name = tensor("x_171_groups_0"), val = tensor(512)]; tensor x_171_strides_0 = const()[name = tensor("x_171_strides_0"), val = tensor([1])]; tensor x_171_pad_0 = const()[name = tensor("x_171_pad_0"), val = tensor([0, 0])]; tensor x_171_dilations_0 = const()[name = tensor("x_171_dilations_0"), val = tensor([1])]; tensor d_decoders_12_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_12_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40352256))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40357952))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_171_cast_fp16 = conv(dilations = x_171_dilations_0, groups = x_171_groups_0, pad = x_171_pad_0, pad_type = x_171_pad_type_0, strides = x_171_strides_0, weight = d_decoders_12_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_349_cast_fp16)[name = tensor("x_171_cast_fp16")]; tensor x_173_perm_0 = const()[name = tensor("x_173_perm_0"), val = tensor([0, 2, 1])]; tensor x_173_cast_fp16 = transpose(perm = x_173_perm_0, x = x_171_cast_fp16)[name = tensor("transpose_118")]; tensor input_351_cast_fp16 = add(x = x_173_cast_fp16, y = inputs_51_cast_fp16)[name = tensor("input_351_cast_fp16")]; tensor input_353_cast_fp16 = mul(x = input_351_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_353_cast_fp16")]; tensor input_355_cast_fp16 = add(x = input_335_cast_fp16, y = input_353_cast_fp16)[name = tensor("input_355_cast_fp16")]; tensor x_179_axes_0 = const()[name = tensor("x_179_axes_0"), val = tensor([-1])]; tensor d_decoders_12_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_12_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40359040)))]; tensor d_decoders_12_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_12_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40360128)))]; tensor x_179_cast_fp16 = layer_norm(axes = x_179_axes_0, beta = d_decoders_12_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_12_norm3_weight_to_fp16, x = input_355_cast_fp16)[name = tensor("x_179_cast_fp16")]; tensor d_decoders_12_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_12_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40361216))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40623424))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_12_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_12_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40624512)))]; tensor linear_62_cast_fp16 = linear(bias = d_decoders_12_src_attn_linear_q_bias_to_fp16, weight = d_decoders_12_src_attn_linear_q_weight_to_fp16_quantized, x = x_179_cast_fp16)[name = tensor("linear_62_cast_fp16")]; tensor var_1268 = const()[name = tensor("op_1268"), val = tensor([1, -1, 4, 128])]; tensor var_1269_cast_fp16 = reshape(shape = var_1268, x = linear_62_cast_fp16)[name = tensor("op_1269_cast_fp16")]; tensor d_decoders_12_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_12_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40625600))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41149952))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_12_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_12_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41152064)))]; tensor linear_63_cast_fp16 = linear(bias = d_decoders_12_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_12_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_63_cast_fp16")]; tensor tile_12 = const()[name = tensor("tile_12"), val = tensor([512, 512])]; tensor var_1274_axis_0 = const()[name = tensor("op_1274_axis_0"), val = tensor(-1)]; tensor var_1274_cast_fp16_0, tensor var_1274_cast_fp16_1 = split(axis = var_1274_axis_0, split_sizes = tile_12, x = linear_63_cast_fp16)[name = tensor("op_1274_cast_fp16")]; tensor var_1277 = const()[name = tensor("op_1277"), val = tensor([1, -1, 4, 128])]; tensor var_1278_cast_fp16 = reshape(shape = var_1277, x = var_1274_cast_fp16_0)[name = tensor("op_1278_cast_fp16")]; tensor var_1280 = const()[name = tensor("op_1280"), val = tensor([1, -1, 4, 128])]; tensor var_1281_cast_fp16 = reshape(shape = var_1280, x = var_1274_cast_fp16_1)[name = tensor("op_1281_cast_fp16")]; tensor value_25_perm_0 = const()[name = tensor("value_25_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1283_to_fp16 = const()[name = tensor("op_1283_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_51_cast_fp16 = mul(x = var_1269_cast_fp16, y = var_1283_to_fp16)[name = tensor("q_h_51_cast_fp16")]; tensor scores_49_transpose_x_0 = const()[name = tensor("scores_49_transpose_x_0"), val = tensor(false)]; tensor scores_49_transpose_y_0 = const()[name = tensor("scores_49_transpose_y_0"), val = tensor(false)]; tensor transpose_88_perm_0 = const()[name = tensor("transpose_88_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_89_perm_0 = const()[name = tensor("transpose_89_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_89 = transpose(perm = transpose_89_perm_0, x = var_1278_cast_fp16)[name = tensor("transpose_116")]; tensor transpose_88 = transpose(perm = transpose_88_perm_0, x = q_h_51_cast_fp16)[name = tensor("transpose_117")]; tensor scores_49_cast_fp16 = matmul(transpose_x = scores_49_transpose_x_0, transpose_y = scores_49_transpose_y_0, x = transpose_88, y = transpose_89)[name = tensor("scores_49_cast_fp16")]; tensor scores_51_cast_fp16 = select(a = var_8_to_fp16, b = scores_49_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_51_cast_fp16")]; tensor var_1291_cast_fp16 = softmax(axis = var_20, x = scores_51_cast_fp16)[name = tensor("op_1291_cast_fp16")]; tensor input_357_cast_fp16 = select(a = var_9_to_fp16, b = var_1291_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_357_cast_fp16")]; tensor x_181_transpose_x_0 = const()[name = tensor("x_181_transpose_x_0"), val = tensor(false)]; tensor x_181_transpose_y_0 = const()[name = tensor("x_181_transpose_y_0"), val = tensor(false)]; tensor value_25_cast_fp16 = transpose(perm = value_25_perm_0, x = var_1281_cast_fp16)[name = tensor("transpose_115")]; tensor x_181_cast_fp16 = matmul(transpose_x = x_181_transpose_x_0, transpose_y = x_181_transpose_y_0, x = input_357_cast_fp16, y = value_25_cast_fp16)[name = tensor("x_181_cast_fp16")]; tensor var_1295_perm_0 = const()[name = tensor("op_1295_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1297 = const()[name = tensor("op_1297"), val = tensor([1, -1, 512])]; tensor var_1295_cast_fp16 = transpose(perm = var_1295_perm_0, x = x_181_cast_fp16)[name = tensor("transpose_114")]; tensor input_359_cast_fp16 = reshape(shape = var_1297, x = var_1295_cast_fp16)[name = tensor("input_359_cast_fp16")]; tensor d_decoders_12_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_12_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41154176))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41416384))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_12_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_12_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41417472)))]; tensor linear_64_cast_fp16 = linear(bias = d_decoders_12_src_attn_linear_out_bias_to_fp16, weight = d_decoders_12_src_attn_linear_out_weight_to_fp16_quantized, x = input_359_cast_fp16)[name = tensor("linear_64_cast_fp16")]; tensor input_363_cast_fp16 = add(x = input_355_cast_fp16, y = linear_64_cast_fp16)[name = tensor("input_363_cast_fp16")]; tensor input_365_axes_0 = const()[name = tensor("input_365_axes_0"), val = tensor([-1])]; tensor d_decoders_13_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_13_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41418560)))]; tensor d_decoders_13_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_13_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41419648)))]; tensor input_365_cast_fp16 = layer_norm(axes = input_365_axes_0, beta = d_decoders_13_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_13_norm1_weight_to_fp16, x = input_363_cast_fp16)[name = tensor("input_365_cast_fp16")]; tensor d_decoders_13_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_13_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41420736))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(42469376))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_13_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_13_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(42473536)))]; tensor linear_65_cast_fp16 = linear(bias = d_decoders_13_feed_forward_w_1_bias_to_fp16, weight = d_decoders_13_feed_forward_w_1_weight_to_fp16_quantized, x = input_365_cast_fp16)[name = tensor("linear_65_cast_fp16")]; tensor input_369_cast_fp16 = relu(x = linear_65_cast_fp16)[name = tensor("input_369_cast_fp16")]; tensor input_373_axes_0 = const()[name = tensor("input_373_axes_0"), val = tensor([-1])]; tensor d_decoders_13_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_13_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(42477696)))]; tensor d_decoders_13_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_13_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(42481856)))]; tensor input_373_cast_fp16 = layer_norm(axes = input_373_axes_0, beta = d_decoders_13_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_13_feed_forward_norm_weight_to_fp16, x = input_369_cast_fp16)[name = tensor("input_373_cast_fp16")]; tensor d_decoders_13_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_13_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(42486016))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43534656))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_66_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_13_feed_forward_w_2_weight_to_fp16_quantized, x = input_373_cast_fp16)[name = tensor("linear_66_cast_fp16")]; tensor inputs_53_axes_0 = const()[name = tensor("inputs_53_axes_0"), val = tensor([-1])]; tensor d_decoders_13_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_13_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43535744)))]; tensor d_decoders_13_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_13_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43536832)))]; tensor inputs_53_cast_fp16 = layer_norm(axes = inputs_53_axes_0, beta = d_decoders_13_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_13_norm2_weight_to_fp16, x = linear_66_cast_fp16)[name = tensor("inputs_53_cast_fp16")]; tensor inputs_55_cast_fp16 = mul(x = inputs_53_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_55_cast_fp16")]; tensor x_183_perm_0 = const()[name = tensor("x_183_perm_0"), val = tensor([0, 2, 1])]; tensor input_377_pad_0 = const()[name = tensor("input_377_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_377_mode_0 = const()[name = tensor("input_377_mode_0"), val = tensor("constant")]; tensor const_83_to_fp16 = const()[name = tensor("const_83_to_fp16"), val = tensor(0x0p+0)]; tensor x_183_cast_fp16 = transpose(perm = x_183_perm_0, x = inputs_55_cast_fp16)[name = tensor("transpose_113")]; tensor input_377_cast_fp16 = pad(constant_val = const_83_to_fp16, mode = input_377_mode_0, pad = input_377_pad_0, x = x_183_cast_fp16)[name = tensor("input_377_cast_fp16")]; tensor x_185_pad_type_0 = const()[name = tensor("x_185_pad_type_0"), val = tensor("valid")]; tensor x_185_groups_0 = const()[name = tensor("x_185_groups_0"), val = tensor(512)]; tensor x_185_strides_0 = const()[name = tensor("x_185_strides_0"), val = tensor([1])]; tensor x_185_pad_0 = const()[name = tensor("x_185_pad_0"), val = tensor([0, 0])]; tensor x_185_dilations_0 = const()[name = tensor("x_185_dilations_0"), val = tensor([1])]; tensor d_decoders_13_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_13_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43537920))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43543616))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_185_cast_fp16 = conv(dilations = x_185_dilations_0, groups = x_185_groups_0, pad = x_185_pad_0, pad_type = x_185_pad_type_0, strides = x_185_strides_0, weight = d_decoders_13_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_377_cast_fp16)[name = tensor("x_185_cast_fp16")]; tensor x_187_perm_0 = const()[name = tensor("x_187_perm_0"), val = tensor([0, 2, 1])]; tensor x_187_cast_fp16 = transpose(perm = x_187_perm_0, x = x_185_cast_fp16)[name = tensor("transpose_112")]; tensor input_379_cast_fp16 = add(x = x_187_cast_fp16, y = inputs_55_cast_fp16)[name = tensor("input_379_cast_fp16")]; tensor input_381_cast_fp16 = mul(x = input_379_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_381_cast_fp16")]; tensor input_383_cast_fp16 = add(x = input_363_cast_fp16, y = input_381_cast_fp16)[name = tensor("input_383_cast_fp16")]; tensor x_193_axes_0 = const()[name = tensor("x_193_axes_0"), val = tensor([-1])]; tensor d_decoders_13_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_13_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43544704)))]; tensor d_decoders_13_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_13_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43545792)))]; tensor x_193_cast_fp16 = layer_norm(axes = x_193_axes_0, beta = d_decoders_13_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_13_norm3_weight_to_fp16, x = input_383_cast_fp16)[name = tensor("x_193_cast_fp16")]; tensor d_decoders_13_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_13_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43546880))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43809088))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_13_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_13_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43810176)))]; tensor linear_67_cast_fp16 = linear(bias = d_decoders_13_src_attn_linear_q_bias_to_fp16, weight = d_decoders_13_src_attn_linear_q_weight_to_fp16_quantized, x = x_193_cast_fp16)[name = tensor("linear_67_cast_fp16")]; tensor var_1363 = const()[name = tensor("op_1363"), val = tensor([1, -1, 4, 128])]; tensor var_1364_cast_fp16 = reshape(shape = var_1363, x = linear_67_cast_fp16)[name = tensor("op_1364_cast_fp16")]; tensor d_decoders_13_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_13_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43811264))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44335616))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_13_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_13_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44337728)))]; tensor linear_68_cast_fp16 = linear(bias = d_decoders_13_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_13_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_68_cast_fp16")]; tensor tile_13 = const()[name = tensor("tile_13"), val = tensor([512, 512])]; tensor var_1369_axis_0 = const()[name = tensor("op_1369_axis_0"), val = tensor(-1)]; tensor var_1369_cast_fp16_0, tensor var_1369_cast_fp16_1 = split(axis = var_1369_axis_0, split_sizes = tile_13, x = linear_68_cast_fp16)[name = tensor("op_1369_cast_fp16")]; tensor var_1372 = const()[name = tensor("op_1372"), val = tensor([1, -1, 4, 128])]; tensor var_1373_cast_fp16 = reshape(shape = var_1372, x = var_1369_cast_fp16_0)[name = tensor("op_1373_cast_fp16")]; tensor var_1375 = const()[name = tensor("op_1375"), val = tensor([1, -1, 4, 128])]; tensor var_1376_cast_fp16 = reshape(shape = var_1375, x = var_1369_cast_fp16_1)[name = tensor("op_1376_cast_fp16")]; tensor value_27_perm_0 = const()[name = tensor("value_27_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1378_to_fp16 = const()[name = tensor("op_1378_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_55_cast_fp16 = mul(x = var_1364_cast_fp16, y = var_1378_to_fp16)[name = tensor("q_h_55_cast_fp16")]; tensor scores_53_transpose_x_0 = const()[name = tensor("scores_53_transpose_x_0"), val = tensor(false)]; tensor scores_53_transpose_y_0 = const()[name = tensor("scores_53_transpose_y_0"), val = tensor(false)]; tensor transpose_90_perm_0 = const()[name = tensor("transpose_90_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_91_perm_0 = const()[name = tensor("transpose_91_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_91 = transpose(perm = transpose_91_perm_0, x = var_1373_cast_fp16)[name = tensor("transpose_110")]; tensor transpose_90 = transpose(perm = transpose_90_perm_0, x = q_h_55_cast_fp16)[name = tensor("transpose_111")]; tensor scores_53_cast_fp16 = matmul(transpose_x = scores_53_transpose_x_0, transpose_y = scores_53_transpose_y_0, x = transpose_90, y = transpose_91)[name = tensor("scores_53_cast_fp16")]; tensor scores_55_cast_fp16 = select(a = var_8_to_fp16, b = scores_53_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_55_cast_fp16")]; tensor var_1386_cast_fp16 = softmax(axis = var_20, x = scores_55_cast_fp16)[name = tensor("op_1386_cast_fp16")]; tensor input_385_cast_fp16 = select(a = var_9_to_fp16, b = var_1386_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_385_cast_fp16")]; tensor x_195_transpose_x_0 = const()[name = tensor("x_195_transpose_x_0"), val = tensor(false)]; tensor x_195_transpose_y_0 = const()[name = tensor("x_195_transpose_y_0"), val = tensor(false)]; tensor value_27_cast_fp16 = transpose(perm = value_27_perm_0, x = var_1376_cast_fp16)[name = tensor("transpose_109")]; tensor x_195_cast_fp16 = matmul(transpose_x = x_195_transpose_x_0, transpose_y = x_195_transpose_y_0, x = input_385_cast_fp16, y = value_27_cast_fp16)[name = tensor("x_195_cast_fp16")]; tensor var_1390_perm_0 = const()[name = tensor("op_1390_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1392 = const()[name = tensor("op_1392"), val = tensor([1, -1, 512])]; tensor var_1390_cast_fp16 = transpose(perm = var_1390_perm_0, x = x_195_cast_fp16)[name = tensor("transpose_108")]; tensor input_387_cast_fp16 = reshape(shape = var_1392, x = var_1390_cast_fp16)[name = tensor("input_387_cast_fp16")]; tensor d_decoders_13_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_13_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44339840))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44602048))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_13_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_13_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44603136)))]; tensor linear_69_cast_fp16 = linear(bias = d_decoders_13_src_attn_linear_out_bias_to_fp16, weight = d_decoders_13_src_attn_linear_out_weight_to_fp16_quantized, x = input_387_cast_fp16)[name = tensor("linear_69_cast_fp16")]; tensor input_391_cast_fp16 = add(x = input_383_cast_fp16, y = linear_69_cast_fp16)[name = tensor("input_391_cast_fp16")]; tensor input_393_axes_0 = const()[name = tensor("input_393_axes_0"), val = tensor([-1])]; tensor d_decoders_14_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_14_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44604224)))]; tensor d_decoders_14_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_14_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44605312)))]; tensor input_393_cast_fp16 = layer_norm(axes = input_393_axes_0, beta = d_decoders_14_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_14_norm1_weight_to_fp16, x = input_391_cast_fp16)[name = tensor("input_393_cast_fp16")]; tensor d_decoders_14_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_14_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44606400))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45655040))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_14_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_14_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45659200)))]; tensor linear_70_cast_fp16 = linear(bias = d_decoders_14_feed_forward_w_1_bias_to_fp16, weight = d_decoders_14_feed_forward_w_1_weight_to_fp16_quantized, x = input_393_cast_fp16)[name = tensor("linear_70_cast_fp16")]; tensor input_397_cast_fp16 = relu(x = linear_70_cast_fp16)[name = tensor("input_397_cast_fp16")]; tensor input_401_axes_0 = const()[name = tensor("input_401_axes_0"), val = tensor([-1])]; tensor d_decoders_14_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_14_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45663360)))]; tensor d_decoders_14_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_14_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45667520)))]; tensor input_401_cast_fp16 = layer_norm(axes = input_401_axes_0, beta = d_decoders_14_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_14_feed_forward_norm_weight_to_fp16, x = input_397_cast_fp16)[name = tensor("input_401_cast_fp16")]; tensor d_decoders_14_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_14_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45671680))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46720320))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_71_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_14_feed_forward_w_2_weight_to_fp16_quantized, x = input_401_cast_fp16)[name = tensor("linear_71_cast_fp16")]; tensor inputs_57_axes_0 = const()[name = tensor("inputs_57_axes_0"), val = tensor([-1])]; tensor d_decoders_14_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_14_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46721408)))]; tensor d_decoders_14_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_14_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46722496)))]; tensor inputs_57_cast_fp16 = layer_norm(axes = inputs_57_axes_0, beta = d_decoders_14_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_14_norm2_weight_to_fp16, x = linear_71_cast_fp16)[name = tensor("inputs_57_cast_fp16")]; tensor inputs_59_cast_fp16 = mul(x = inputs_57_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_59_cast_fp16")]; tensor x_197_perm_0 = const()[name = tensor("x_197_perm_0"), val = tensor([0, 2, 1])]; tensor input_405_pad_0 = const()[name = tensor("input_405_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_405_mode_0 = const()[name = tensor("input_405_mode_0"), val = tensor("constant")]; tensor const_89_to_fp16 = const()[name = tensor("const_89_to_fp16"), val = tensor(0x0p+0)]; tensor x_197_cast_fp16 = transpose(perm = x_197_perm_0, x = inputs_59_cast_fp16)[name = tensor("transpose_107")]; tensor input_405_cast_fp16 = pad(constant_val = const_89_to_fp16, mode = input_405_mode_0, pad = input_405_pad_0, x = x_197_cast_fp16)[name = tensor("input_405_cast_fp16")]; tensor x_199_pad_type_0 = const()[name = tensor("x_199_pad_type_0"), val = tensor("valid")]; tensor x_199_groups_0 = const()[name = tensor("x_199_groups_0"), val = tensor(512)]; tensor x_199_strides_0 = const()[name = tensor("x_199_strides_0"), val = tensor([1])]; tensor x_199_pad_0 = const()[name = tensor("x_199_pad_0"), val = tensor([0, 0])]; tensor x_199_dilations_0 = const()[name = tensor("x_199_dilations_0"), val = tensor([1])]; tensor d_decoders_14_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_14_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46723584))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46729280))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_199_cast_fp16 = conv(dilations = x_199_dilations_0, groups = x_199_groups_0, pad = x_199_pad_0, pad_type = x_199_pad_type_0, strides = x_199_strides_0, weight = d_decoders_14_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_405_cast_fp16)[name = tensor("x_199_cast_fp16")]; tensor x_201_perm_0 = const()[name = tensor("x_201_perm_0"), val = tensor([0, 2, 1])]; tensor x_201_cast_fp16 = transpose(perm = x_201_perm_0, x = x_199_cast_fp16)[name = tensor("transpose_106")]; tensor input_407_cast_fp16 = add(x = x_201_cast_fp16, y = inputs_59_cast_fp16)[name = tensor("input_407_cast_fp16")]; tensor input_409_cast_fp16 = mul(x = input_407_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_409_cast_fp16")]; tensor input_411_cast_fp16 = add(x = input_391_cast_fp16, y = input_409_cast_fp16)[name = tensor("input_411_cast_fp16")]; tensor x_207_axes_0 = const()[name = tensor("x_207_axes_0"), val = tensor([-1])]; tensor d_decoders_14_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_14_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46730368)))]; tensor d_decoders_14_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_14_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46731456)))]; tensor x_207_cast_fp16 = layer_norm(axes = x_207_axes_0, beta = d_decoders_14_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_14_norm3_weight_to_fp16, x = input_411_cast_fp16)[name = tensor("x_207_cast_fp16")]; tensor d_decoders_14_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_14_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46732544))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46994752))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_14_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_14_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46995840)))]; tensor linear_72_cast_fp16 = linear(bias = d_decoders_14_src_attn_linear_q_bias_to_fp16, weight = d_decoders_14_src_attn_linear_q_weight_to_fp16_quantized, x = x_207_cast_fp16)[name = tensor("linear_72_cast_fp16")]; tensor var_1458 = const()[name = tensor("op_1458"), val = tensor([1, -1, 4, 128])]; tensor var_1459_cast_fp16 = reshape(shape = var_1458, x = linear_72_cast_fp16)[name = tensor("op_1459_cast_fp16")]; tensor d_decoders_14_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_14_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46996928))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47521280))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_14_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_14_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47523392)))]; tensor linear_73_cast_fp16 = linear(bias = d_decoders_14_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_14_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_73_cast_fp16")]; tensor tile_14 = const()[name = tensor("tile_14"), val = tensor([512, 512])]; tensor var_1464_axis_0 = const()[name = tensor("op_1464_axis_0"), val = tensor(-1)]; tensor var_1464_cast_fp16_0, tensor var_1464_cast_fp16_1 = split(axis = var_1464_axis_0, split_sizes = tile_14, x = linear_73_cast_fp16)[name = tensor("op_1464_cast_fp16")]; tensor var_1467 = const()[name = tensor("op_1467"), val = tensor([1, -1, 4, 128])]; tensor var_1468_cast_fp16 = reshape(shape = var_1467, x = var_1464_cast_fp16_0)[name = tensor("op_1468_cast_fp16")]; tensor var_1470 = const()[name = tensor("op_1470"), val = tensor([1, -1, 4, 128])]; tensor var_1471_cast_fp16 = reshape(shape = var_1470, x = var_1464_cast_fp16_1)[name = tensor("op_1471_cast_fp16")]; tensor value_29_perm_0 = const()[name = tensor("value_29_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1473_to_fp16 = const()[name = tensor("op_1473_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_59_cast_fp16 = mul(x = var_1459_cast_fp16, y = var_1473_to_fp16)[name = tensor("q_h_59_cast_fp16")]; tensor scores_57_transpose_x_0 = const()[name = tensor("scores_57_transpose_x_0"), val = tensor(false)]; tensor scores_57_transpose_y_0 = const()[name = tensor("scores_57_transpose_y_0"), val = tensor(false)]; tensor transpose_92_perm_0 = const()[name = tensor("transpose_92_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_93_perm_0 = const()[name = tensor("transpose_93_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_93 = transpose(perm = transpose_93_perm_0, x = var_1468_cast_fp16)[name = tensor("transpose_104")]; tensor transpose_92 = transpose(perm = transpose_92_perm_0, x = q_h_59_cast_fp16)[name = tensor("transpose_105")]; tensor scores_57_cast_fp16 = matmul(transpose_x = scores_57_transpose_x_0, transpose_y = scores_57_transpose_y_0, x = transpose_92, y = transpose_93)[name = tensor("scores_57_cast_fp16")]; tensor scores_59_cast_fp16 = select(a = var_8_to_fp16, b = scores_57_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_59_cast_fp16")]; tensor var_1481_cast_fp16 = softmax(axis = var_20, x = scores_59_cast_fp16)[name = tensor("op_1481_cast_fp16")]; tensor input_413_cast_fp16 = select(a = var_9_to_fp16, b = var_1481_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_413_cast_fp16")]; tensor x_209_transpose_x_0 = const()[name = tensor("x_209_transpose_x_0"), val = tensor(false)]; tensor x_209_transpose_y_0 = const()[name = tensor("x_209_transpose_y_0"), val = tensor(false)]; tensor value_29_cast_fp16 = transpose(perm = value_29_perm_0, x = var_1471_cast_fp16)[name = tensor("transpose_103")]; tensor x_209_cast_fp16 = matmul(transpose_x = x_209_transpose_x_0, transpose_y = x_209_transpose_y_0, x = input_413_cast_fp16, y = value_29_cast_fp16)[name = tensor("x_209_cast_fp16")]; tensor var_1485_perm_0 = const()[name = tensor("op_1485_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1487 = const()[name = tensor("op_1487"), val = tensor([1, -1, 512])]; tensor var_1485_cast_fp16 = transpose(perm = var_1485_perm_0, x = x_209_cast_fp16)[name = tensor("transpose_102")]; tensor input_415_cast_fp16 = reshape(shape = var_1487, x = var_1485_cast_fp16)[name = tensor("input_415_cast_fp16")]; tensor d_decoders_14_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_14_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47525504))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47787712))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_14_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_14_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47788800)))]; tensor linear_74_cast_fp16 = linear(bias = d_decoders_14_src_attn_linear_out_bias_to_fp16, weight = d_decoders_14_src_attn_linear_out_weight_to_fp16_quantized, x = input_415_cast_fp16)[name = tensor("linear_74_cast_fp16")]; tensor input_419_cast_fp16 = add(x = input_411_cast_fp16, y = linear_74_cast_fp16)[name = tensor("input_419_cast_fp16")]; tensor input_421_axes_0 = const()[name = tensor("input_421_axes_0"), val = tensor([-1])]; tensor d_decoders_15_norm1_weight_to_fp16 = const()[name = tensor("d_decoders_15_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47789888)))]; tensor d_decoders_15_norm1_bias_to_fp16 = const()[name = tensor("d_decoders_15_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47790976)))]; tensor input_421_cast_fp16 = layer_norm(axes = input_421_axes_0, beta = d_decoders_15_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_15_norm1_weight_to_fp16, x = input_419_cast_fp16)[name = tensor("input_421_cast_fp16")]; tensor d_decoders_15_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_15_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47792064))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(48840704))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders_15_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders_15_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(48844864)))]; tensor linear_75_cast_fp16 = linear(bias = d_decoders_15_feed_forward_w_1_bias_to_fp16, weight = d_decoders_15_feed_forward_w_1_weight_to_fp16_quantized, x = input_421_cast_fp16)[name = tensor("linear_75_cast_fp16")]; tensor input_425_cast_fp16 = relu(x = linear_75_cast_fp16)[name = tensor("input_425_cast_fp16")]; tensor input_429_axes_0 = const()[name = tensor("input_429_axes_0"), val = tensor([-1])]; tensor d_decoders_15_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders_15_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(48849024)))]; tensor d_decoders_15_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders_15_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(48853184)))]; tensor input_429_cast_fp16 = layer_norm(axes = input_429_axes_0, beta = d_decoders_15_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_15_feed_forward_norm_weight_to_fp16, x = input_425_cast_fp16)[name = tensor("input_429_cast_fp16")]; tensor d_decoders_15_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_15_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(48857344))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49905984))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_76_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders_15_feed_forward_w_2_weight_to_fp16_quantized, x = input_429_cast_fp16)[name = tensor("linear_76_cast_fp16")]; tensor inputs_61_axes_0 = const()[name = tensor("inputs_61_axes_0"), val = tensor([-1])]; tensor d_decoders_15_norm2_weight_to_fp16 = const()[name = tensor("d_decoders_15_norm2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49907072)))]; tensor d_decoders_15_norm2_bias_to_fp16 = const()[name = tensor("d_decoders_15_norm2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49908160)))]; tensor inputs_61_cast_fp16 = layer_norm(axes = inputs_61_axes_0, beta = d_decoders_15_norm2_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_15_norm2_weight_to_fp16, x = linear_76_cast_fp16)[name = tensor("inputs_61_cast_fp16")]; tensor inputs_cast_fp16 = mul(x = inputs_61_cast_fp16, y = mask_9_cast_fp16)[name = tensor("inputs_cast_fp16")]; tensor x_211_perm_0 = const()[name = tensor("x_211_perm_0"), val = tensor([0, 2, 1])]; tensor input_433_pad_0 = const()[name = tensor("input_433_pad_0"), val = tensor([0, 0, 0, 0, 5, 5])]; tensor input_433_mode_0 = const()[name = tensor("input_433_mode_0"), val = tensor("constant")]; tensor const_95_to_fp16 = const()[name = tensor("const_95_to_fp16"), val = tensor(0x0p+0)]; tensor x_211_cast_fp16 = transpose(perm = x_211_perm_0, x = inputs_cast_fp16)[name = tensor("transpose_101")]; tensor input_433_cast_fp16 = pad(constant_val = const_95_to_fp16, mode = input_433_mode_0, pad = input_433_pad_0, x = x_211_cast_fp16)[name = tensor("input_433_cast_fp16")]; tensor x_213_pad_type_0 = const()[name = tensor("x_213_pad_type_0"), val = tensor("valid")]; tensor x_213_groups_0 = const()[name = tensor("x_213_groups_0"), val = tensor(512)]; tensor x_213_strides_0 = const()[name = tensor("x_213_strides_0"), val = tensor([1])]; tensor x_213_pad_0 = const()[name = tensor("x_213_pad_0"), val = tensor([0, 0])]; tensor x_213_dilations_0 = const()[name = tensor("x_213_dilations_0"), val = tensor([1])]; tensor d_decoders_15_self_attn_fsmn_block_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_15_self_attn_fsmn_block_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49909248))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49914944))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor x_213_cast_fp16 = conv(dilations = x_213_dilations_0, groups = x_213_groups_0, pad = x_213_pad_0, pad_type = x_213_pad_type_0, strides = x_213_strides_0, weight = d_decoders_15_self_attn_fsmn_block_weight_to_fp16_quantized, x = input_433_cast_fp16)[name = tensor("x_213_cast_fp16")]; tensor x_215_perm_0 = const()[name = tensor("x_215_perm_0"), val = tensor([0, 2, 1])]; tensor x_215_cast_fp16 = transpose(perm = x_215_perm_0, x = x_213_cast_fp16)[name = tensor("transpose_100")]; tensor input_435_cast_fp16 = add(x = x_215_cast_fp16, y = inputs_cast_fp16)[name = tensor("input_435_cast_fp16")]; tensor input_437_cast_fp16 = mul(x = input_435_cast_fp16, y = mask_9_cast_fp16)[name = tensor("input_437_cast_fp16")]; tensor input_439_cast_fp16 = add(x = input_419_cast_fp16, y = input_437_cast_fp16)[name = tensor("input_439_cast_fp16")]; tensor x_221_axes_0 = const()[name = tensor("x_221_axes_0"), val = tensor([-1])]; tensor d_decoders_15_norm3_weight_to_fp16 = const()[name = tensor("d_decoders_15_norm3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49916032)))]; tensor d_decoders_15_norm3_bias_to_fp16 = const()[name = tensor("d_decoders_15_norm3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49917120)))]; tensor x_221_cast_fp16 = layer_norm(axes = x_221_axes_0, beta = d_decoders_15_norm3_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders_15_norm3_weight_to_fp16, x = input_439_cast_fp16)[name = tensor("x_221_cast_fp16")]; tensor d_decoders_15_src_attn_linear_q_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_15_src_attn_linear_q_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49918208))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50180416))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_15_src_attn_linear_q_bias_to_fp16 = const()[name = tensor("d_decoders_15_src_attn_linear_q_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50181504)))]; tensor linear_77_cast_fp16 = linear(bias = d_decoders_15_src_attn_linear_q_bias_to_fp16, weight = d_decoders_15_src_attn_linear_q_weight_to_fp16_quantized, x = x_221_cast_fp16)[name = tensor("linear_77_cast_fp16")]; tensor var_1553 = const()[name = tensor("op_1553"), val = tensor([1, -1, 4, 128])]; tensor var_1554_cast_fp16 = reshape(shape = var_1553, x = linear_77_cast_fp16)[name = tensor("op_1554_cast_fp16")]; tensor d_decoders_15_src_attn_linear_k_v_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_15_src_attn_linear_k_v_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50182592))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50706944))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2920896)))]; tensor d_decoders_15_src_attn_linear_k_v_bias_to_fp16 = const()[name = tensor("d_decoders_15_src_attn_linear_k_v_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50709056)))]; tensor linear_78_cast_fp16 = linear(bias = d_decoders_15_src_attn_linear_k_v_bias_to_fp16, weight = d_decoders_15_src_attn_linear_k_v_weight_to_fp16_quantized, x = enc_to_fp16)[name = tensor("linear_78_cast_fp16")]; tensor tile_15 = const()[name = tensor("tile_15"), val = tensor([512, 512])]; tensor var_1559_axis_0 = const()[name = tensor("op_1559_axis_0"), val = tensor(-1)]; tensor var_1559_cast_fp16_0, tensor var_1559_cast_fp16_1 = split(axis = var_1559_axis_0, split_sizes = tile_15, x = linear_78_cast_fp16)[name = tensor("op_1559_cast_fp16")]; tensor var_1562 = const()[name = tensor("op_1562"), val = tensor([1, -1, 4, 128])]; tensor var_1563_cast_fp16 = reshape(shape = var_1562, x = var_1559_cast_fp16_0)[name = tensor("op_1563_cast_fp16")]; tensor var_1565 = const()[name = tensor("op_1565"), val = tensor([1, -1, 4, 128])]; tensor var_1566_cast_fp16 = reshape(shape = var_1565, x = var_1559_cast_fp16_1)[name = tensor("op_1566_cast_fp16")]; tensor value_perm_0 = const()[name = tensor("value_perm_0"), val = tensor([0, 2, -3, -1])]; tensor var_1568_to_fp16 = const()[name = tensor("op_1568_to_fp16"), val = tensor(0x1.6ap-4)]; tensor q_h_cast_fp16 = mul(x = var_1554_cast_fp16, y = var_1568_to_fp16)[name = tensor("q_h_cast_fp16")]; tensor scores_61_transpose_x_0 = const()[name = tensor("scores_61_transpose_x_0"), val = tensor(false)]; tensor scores_61_transpose_y_0 = const()[name = tensor("scores_61_transpose_y_0"), val = tensor(false)]; tensor transpose_94_perm_0 = const()[name = tensor("transpose_94_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_95_perm_0 = const()[name = tensor("transpose_95_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_95 = transpose(perm = transpose_95_perm_0, x = var_1563_cast_fp16)[name = tensor("transpose_98")]; tensor transpose_94 = transpose(perm = transpose_94_perm_0, x = q_h_cast_fp16)[name = tensor("transpose_99")]; tensor scores_61_cast_fp16 = matmul(transpose_x = scores_61_transpose_x_0, transpose_y = scores_61_transpose_y_0, x = transpose_94, y = transpose_95)[name = tensor("scores_61_cast_fp16")]; tensor scores_cast_fp16 = select(a = var_8_to_fp16, b = scores_61_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("scores_cast_fp16")]; tensor var_1576_cast_fp16 = softmax(axis = var_20, x = scores_cast_fp16)[name = tensor("op_1576_cast_fp16")]; tensor input_441_cast_fp16 = select(a = var_9_to_fp16, b = var_1576_cast_fp16, cond = mask_15_cast_fp16)[name = tensor("input_441_cast_fp16")]; tensor x_transpose_x_0 = const()[name = tensor("x_transpose_x_0"), val = tensor(false)]; tensor x_transpose_y_0 = const()[name = tensor("x_transpose_y_0"), val = tensor(false)]; tensor value_cast_fp16 = transpose(perm = value_perm_0, x = var_1566_cast_fp16)[name = tensor("transpose_97")]; tensor x_cast_fp16 = matmul(transpose_x = x_transpose_x_0, transpose_y = x_transpose_y_0, x = input_441_cast_fp16, y = value_cast_fp16)[name = tensor("x_cast_fp16")]; tensor var_1580_perm_0 = const()[name = tensor("op_1580_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1582 = const()[name = tensor("op_1582"), val = tensor([1, -1, 512])]; tensor var_1580_cast_fp16 = transpose(perm = var_1580_perm_0, x = x_cast_fp16)[name = tensor("transpose_96")]; tensor input_443_cast_fp16 = reshape(shape = var_1582, x = var_1580_cast_fp16)[name = tensor("input_443_cast_fp16")]; tensor d_decoders_15_src_attn_linear_out_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders_15_src_attn_linear_out_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50711168))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50973376))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor d_decoders_15_src_attn_linear_out_bias_to_fp16 = const()[name = tensor("d_decoders_15_src_attn_linear_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50974464)))]; tensor linear_79_cast_fp16 = linear(bias = d_decoders_15_src_attn_linear_out_bias_to_fp16, weight = d_decoders_15_src_attn_linear_out_weight_to_fp16_quantized, x = input_443_cast_fp16)[name = tensor("linear_79_cast_fp16")]; tensor input_447_cast_fp16 = add(x = input_439_cast_fp16, y = linear_79_cast_fp16)[name = tensor("input_447_cast_fp16")]; tensor input_449_axes_0 = const()[name = tensor("input_449_axes_0"), val = tensor([-1])]; tensor d_decoders3_0_norm1_weight_to_fp16 = const()[name = tensor("d_decoders3_0_norm1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50975552)))]; tensor d_decoders3_0_norm1_bias_to_fp16 = const()[name = tensor("d_decoders3_0_norm1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50976640)))]; tensor input_449_cast_fp16 = layer_norm(axes = input_449_axes_0, beta = d_decoders3_0_norm1_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders3_0_norm1_weight_to_fp16, x = input_447_cast_fp16)[name = tensor("input_449_cast_fp16")]; tensor d_decoders3_0_feed_forward_w_1_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders3_0_feed_forward_w_1_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50977728))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(52026368))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050880)))]; tensor d_decoders3_0_feed_forward_w_1_bias_to_fp16 = const()[name = tensor("d_decoders3_0_feed_forward_w_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(52030528)))]; tensor linear_80_cast_fp16 = linear(bias = d_decoders3_0_feed_forward_w_1_bias_to_fp16, weight = d_decoders3_0_feed_forward_w_1_weight_to_fp16_quantized, x = input_449_cast_fp16)[name = tensor("linear_80_cast_fp16")]; tensor input_453_cast_fp16 = relu(x = linear_80_cast_fp16)[name = tensor("input_453_cast_fp16")]; tensor input_457_axes_0 = const()[name = tensor("input_457_axes_0"), val = tensor([-1])]; tensor d_decoders3_0_feed_forward_norm_weight_to_fp16 = const()[name = tensor("d_decoders3_0_feed_forward_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(52034688)))]; tensor d_decoders3_0_feed_forward_norm_bias_to_fp16 = const()[name = tensor("d_decoders3_0_feed_forward_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(52038848)))]; tensor input_457_cast_fp16 = layer_norm(axes = input_457_axes_0, beta = d_decoders3_0_feed_forward_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_decoders3_0_feed_forward_norm_weight_to_fp16, x = input_453_cast_fp16)[name = tensor("input_457_cast_fp16")]; tensor d_decoders3_0_feed_forward_w_2_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_decoders3_0_feed_forward_w_2_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(52043008))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53091648))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2118272)))]; tensor linear_81_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = d_decoders3_0_feed_forward_w_2_weight_to_fp16_quantized, x = input_457_cast_fp16)[name = tensor("linear_81_cast_fp16")]; tensor input_axes_0 = const()[name = tensor("input_axes_0"), val = tensor([-1])]; tensor d_after_norm_weight_to_fp16 = const()[name = tensor("d_after_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53092736)))]; tensor d_after_norm_bias_to_fp16 = const()[name = tensor("d_after_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53093824)))]; tensor input_cast_fp16 = layer_norm(axes = input_axes_0, beta = d_after_norm_bias_to_fp16, epsilon = var_15_to_fp16, gamma = d_after_norm_weight_to_fp16, x = linear_81_cast_fp16)[name = tensor("input_cast_fp16")]; tensor d_output_layer_weight_to_fp16_quantized = constexpr_affine_dequantize()[axis = tensor(0), name = tensor("d_output_layer_weight_to_fp16_quantized"), quantized_data = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53094912))), scale = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57406336))), zero_point = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57397824)))]; tensor d_output_layer_bias_to_fp16 = const()[name = tensor("d_output_layer_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57423232)))]; tensor logits = linear(bias = d_output_layer_bias_to_fp16, weight = d_output_layer_weight_to_fp16_quantized, x = input_cast_fp16)[name = tensor("linear_82_cast_fp16")]; } -> (logits); }