program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3500.14.1"}, {"coremlc-version", "3500.32.1"}, {"coremltools-component-torch", "2.4.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "8.3.0"}})] { func main(tensor audio_length, tensor audio_signal, tensor cache_last_channel, tensor cache_last_channel_len, tensor cache_last_time, tensor pre_cache) { tensor var_9 = const()[name = tensor("op_9"), val = tensor(2)]; tensor full_input_interleave_0 = const()[name = tensor("full_input_interleave_0"), val = tensor(false)]; tensor pre_cache_to_fp16_dtype_0 = const()[name = tensor("pre_cache_to_fp16_dtype_0"), val = tensor("fp16")]; tensor audio_signal_to_fp16_dtype_0 = const()[name = tensor("audio_signal_to_fp16_dtype_0"), val = tensor("fp16")]; tensor audio_signal_to_fp16 = cast(dtype = audio_signal_to_fp16_dtype_0, x = audio_signal)[name = tensor("cast_195")]; tensor pre_cache_to_fp16 = cast(dtype = pre_cache_to_fp16_dtype_0, x = pre_cache)[name = tensor("cast_196")]; tensor full_input_cast_fp16 = concat(axis = var_9, interleave = full_input_interleave_0, values = (pre_cache_to_fp16, audio_signal_to_fp16))[name = tensor("full_input_cast_fp16")]; tensor var_12 = const()[name = tensor("op_12"), val = tensor(16)]; tensor value_1 = add(x = audio_length, y = var_12)[name = tensor("value_1")]; tensor var_28_begin_0 = const()[name = tensor("op_28_begin_0"), val = tensor([0, 0, 17])]; tensor var_28_end_0 = const()[name = tensor("op_28_end_0"), val = tensor([1, 128, 33])]; tensor var_28_end_mask_0 = const()[name = tensor("op_28_end_mask_0"), val = tensor([true, true, true])]; tensor var_28_cast_fp16 = slice_by_index(begin = var_28_begin_0, end = var_28_end_0, end_mask = var_28_end_mask_0, x = full_input_cast_fp16)[name = tensor("op_28_cast_fp16")]; tensor var_28_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("op_28_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor var_62 = const()[name = tensor("op_62"), val = tensor(-1)]; tensor var_64 = const()[name = tensor("op_64"), val = tensor(1)]; tensor x_1_perm_0 = const()[name = tensor("x_1_perm_0"), val = tensor([0, 2, 1])]; tensor cast_0_to_fp16_dtype_0 = const()[name = tensor("cast_0_to_fp16_dtype_0"), val = tensor("fp16")]; tensor _inversed_108_y_0_to_fp16 = const()[name = tensor("_inversed_108_y_0_to_fp16"), val = tensor(0x1p-1)]; tensor value_1_to_fp16 = cast(dtype = cast_0_to_fp16_dtype_0, x = value_1)[name = tensor("cast_193")]; tensor _inversed_108_cast_fp16 = mul(x = value_1_to_fp16, y = _inversed_108_y_0_to_fp16)[name = tensor("_inversed_108_cast_fp16")]; tensor var_109_to_fp16 = const()[name = tensor("op_109_to_fp16"), val = tensor(0x1p+0)]; tensor lengths_1_cast_fp16 = add(x = _inversed_108_cast_fp16, y = var_109_to_fp16)[name = tensor("lengths_1_cast_fp16")]; tensor lengths_3_cast_fp16 = floor(x = lengths_1_cast_fp16)[name = tensor("lengths_3_cast_fp16")]; tensor _inversed_116_y_0_to_fp16 = const()[name = tensor("_inversed_116_y_0_to_fp16"), val = tensor(0x1p-1)]; tensor _inversed_116_cast_fp16 = mul(x = lengths_3_cast_fp16, y = _inversed_116_y_0_to_fp16)[name = tensor("_inversed_116_cast_fp16")]; tensor var_117_to_fp16 = const()[name = tensor("op_117_to_fp16"), val = tensor(0x1p+0)]; tensor lengths_7_cast_fp16 = add(x = _inversed_116_cast_fp16, y = var_117_to_fp16)[name = tensor("lengths_7_cast_fp16")]; tensor lengths_9_cast_fp16 = floor(x = lengths_7_cast_fp16)[name = tensor("lengths_9_cast_fp16")]; tensor _inversed_124_y_0_to_fp16 = const()[name = tensor("_inversed_124_y_0_to_fp16"), val = tensor(0x1p-1)]; tensor _inversed_124_cast_fp16 = mul(x = lengths_9_cast_fp16, y = _inversed_124_y_0_to_fp16)[name = tensor("_inversed_124_cast_fp16")]; tensor var_125_to_fp16 = const()[name = tensor("op_125_to_fp16"), val = tensor(0x1p+0)]; tensor lengths_13_cast_fp16 = add(x = _inversed_124_cast_fp16, y = var_125_to_fp16)[name = tensor("lengths_13_cast_fp16")]; tensor lengths_cast_fp16 = floor(x = lengths_13_cast_fp16)[name = tensor("lengths_cast_fp16")]; tensor cast_9_dtype_0 = const()[name = tensor("cast_9_dtype_0"), val = tensor("int32")]; tensor input_1_axes_0 = const()[name = tensor("input_1_axes_0"), val = tensor([1])]; tensor x_1_cast_fp16 = transpose(perm = x_1_perm_0, x = full_input_cast_fp16)[name = tensor("transpose_241")]; tensor input_1_cast_fp16 = expand_dims(axes = input_1_axes_0, x = x_1_cast_fp16)[name = tensor("input_1_cast_fp16")]; tensor input_3_pad_0 = const()[name = tensor("input_3_pad_0"), val = tensor([0, 0, 0, 0, 2, 1, 2, 1])]; tensor input_3_mode_0 = const()[name = tensor("input_3_mode_0"), val = tensor("constant")]; tensor const_0_to_fp16 = const()[name = tensor("const_0_to_fp16"), val = tensor(0x0p+0)]; tensor input_3_cast_fp16 = pad(constant_val = const_0_to_fp16, mode = input_3_mode_0, pad = input_3_pad_0, x = input_1_cast_fp16)[name = tensor("input_3_cast_fp16")]; tensor input_5_pad_type_0 = const()[name = tensor("input_5_pad_type_0"), val = tensor("valid")]; tensor input_5_strides_0 = const()[name = tensor("input_5_strides_0"), val = tensor([2, 2])]; tensor input_5_pad_0 = const()[name = tensor("input_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_5_dilations_0 = const()[name = tensor("input_5_dilations_0"), val = tensor([1, 1])]; tensor input_5_groups_0 = const()[name = tensor("input_5_groups_0"), val = tensor(1)]; tensor encoder_pre_encode_conv_0_weight_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor encoder_pre_encode_conv_0_bias_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4736)))]; tensor input_5_cast_fp16 = conv(bias = encoder_pre_encode_conv_0_bias_to_fp16, dilations = input_5_dilations_0, groups = input_5_groups_0, pad = input_5_pad_0, pad_type = input_5_pad_type_0, strides = input_5_strides_0, weight = encoder_pre_encode_conv_0_weight_to_fp16, x = input_3_cast_fp16)[name = tensor("input_5_cast_fp16")]; tensor input_7_cast_fp16 = relu(x = input_5_cast_fp16)[name = tensor("input_7_cast_fp16")]; tensor input_9_pad_0 = const()[name = tensor("input_9_pad_0"), val = tensor([0, 0, 0, 0, 2, 1, 2, 1])]; tensor input_9_mode_0 = const()[name = tensor("input_9_mode_0"), val = tensor("constant")]; tensor const_1_to_fp16 = const()[name = tensor("const_1_to_fp16"), val = tensor(0x0p+0)]; tensor input_9_cast_fp16 = pad(constant_val = const_1_to_fp16, mode = input_9_mode_0, pad = input_9_pad_0, x = input_7_cast_fp16)[name = tensor("input_9_cast_fp16")]; tensor input_11_pad_type_0 = const()[name = tensor("input_11_pad_type_0"), val = tensor("valid")]; tensor input_11_strides_0 = const()[name = tensor("input_11_strides_0"), val = tensor([2, 2])]; tensor input_11_groups_0 = const()[name = tensor("input_11_groups_0"), val = tensor(256)]; tensor input_11_pad_0 = const()[name = tensor("input_11_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_11_dilations_0 = const()[name = tensor("input_11_dilations_0"), val = tensor([1, 1])]; tensor encoder_pre_encode_conv_2_weight_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5312)))]; tensor encoder_pre_encode_conv_2_bias_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9984)))]; tensor input_11_cast_fp16 = conv(bias = encoder_pre_encode_conv_2_bias_to_fp16, dilations = input_11_dilations_0, groups = input_11_groups_0, pad = input_11_pad_0, pad_type = input_11_pad_type_0, strides = input_11_strides_0, weight = encoder_pre_encode_conv_2_weight_to_fp16, x = input_9_cast_fp16)[name = tensor("input_11_cast_fp16")]; tensor input_13_pad_type_0 = const()[name = tensor("input_13_pad_type_0"), val = tensor("valid")]; tensor input_13_strides_0 = const()[name = tensor("input_13_strides_0"), val = tensor([1, 1])]; tensor input_13_pad_0 = const()[name = tensor("input_13_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_13_dilations_0 = const()[name = tensor("input_13_dilations_0"), val = tensor([1, 1])]; tensor input_13_groups_0 = const()[name = tensor("input_13_groups_0"), val = tensor(1)]; tensor encoder_pre_encode_conv_3_weight_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_3_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10560)))]; tensor encoder_pre_encode_conv_3_bias_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_3_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141696)))]; tensor input_13_cast_fp16 = conv(bias = encoder_pre_encode_conv_3_bias_to_fp16, dilations = input_13_dilations_0, groups = input_13_groups_0, pad = input_13_pad_0, pad_type = input_13_pad_type_0, strides = input_13_strides_0, weight = encoder_pre_encode_conv_3_weight_to_fp16, x = input_11_cast_fp16)[name = tensor("input_13_cast_fp16")]; tensor input_15_cast_fp16 = relu(x = input_13_cast_fp16)[name = tensor("input_15_cast_fp16")]; tensor input_17_pad_0 = const()[name = tensor("input_17_pad_0"), val = tensor([0, 0, 0, 0, 2, 1, 2, 1])]; tensor input_17_mode_0 = const()[name = tensor("input_17_mode_0"), val = tensor("constant")]; tensor const_2_to_fp16 = const()[name = tensor("const_2_to_fp16"), val = tensor(0x0p+0)]; tensor input_17_cast_fp16 = pad(constant_val = const_2_to_fp16, mode = input_17_mode_0, pad = input_17_pad_0, x = input_15_cast_fp16)[name = tensor("input_17_cast_fp16")]; tensor input_19_pad_type_0 = const()[name = tensor("input_19_pad_type_0"), val = tensor("valid")]; tensor input_19_strides_0 = const()[name = tensor("input_19_strides_0"), val = tensor([2, 2])]; tensor input_19_groups_0 = const()[name = tensor("input_19_groups_0"), val = tensor(256)]; tensor input_19_pad_0 = const()[name = tensor("input_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_19_dilations_0 = const()[name = tensor("input_19_dilations_0"), val = tensor([1, 1])]; tensor encoder_pre_encode_conv_5_weight_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_5_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(142272)))]; tensor encoder_pre_encode_conv_5_bias_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_5_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146944)))]; tensor input_19_cast_fp16 = conv(bias = encoder_pre_encode_conv_5_bias_to_fp16, dilations = input_19_dilations_0, groups = input_19_groups_0, pad = input_19_pad_0, pad_type = input_19_pad_type_0, strides = input_19_strides_0, weight = encoder_pre_encode_conv_5_weight_to_fp16, x = input_17_cast_fp16)[name = tensor("input_19_cast_fp16")]; tensor input_21_pad_type_0 = const()[name = tensor("input_21_pad_type_0"), val = tensor("valid")]; tensor input_21_strides_0 = const()[name = tensor("input_21_strides_0"), val = tensor([1, 1])]; tensor input_21_pad_0 = const()[name = tensor("input_21_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_21_dilations_0 = const()[name = tensor("input_21_dilations_0"), val = tensor([1, 1])]; tensor input_21_groups_0 = const()[name = tensor("input_21_groups_0"), val = tensor(1)]; tensor encoder_pre_encode_conv_6_weight_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_6_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(147520)))]; tensor encoder_pre_encode_conv_6_bias_to_fp16 = const()[name = tensor("encoder_pre_encode_conv_6_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278656)))]; tensor input_21_cast_fp16 = conv(bias = encoder_pre_encode_conv_6_bias_to_fp16, dilations = input_21_dilations_0, groups = input_21_groups_0, pad = input_21_pad_0, pad_type = input_21_pad_type_0, strides = input_21_strides_0, weight = encoder_pre_encode_conv_6_weight_to_fp16, x = input_19_cast_fp16)[name = tensor("input_21_cast_fp16")]; tensor x_3_cast_fp16 = relu(x = input_21_cast_fp16)[name = tensor("x_3_cast_fp16")]; tensor var_181_perm_0 = const()[name = tensor("op_181_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_182 = const()[name = tensor("op_182"), val = tensor([1, 5, -1])]; tensor var_181_cast_fp16 = transpose(perm = var_181_perm_0, x = x_3_cast_fp16)[name = tensor("transpose_240")]; tensor input_23_cast_fp16 = reshape(shape = var_182, x = var_181_cast_fp16)[name = tensor("input_23_cast_fp16")]; tensor encoder_pre_encode_out_weight_to_fp16 = const()[name = tensor("encoder_pre_encode_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(279232)))]; tensor encoder_pre_encode_out_bias_to_fp16 = const()[name = tensor("encoder_pre_encode_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4735744)))]; tensor linear_0_cast_fp16 = linear(bias = encoder_pre_encode_out_bias_to_fp16, weight = encoder_pre_encode_out_weight_to_fp16, x = input_23_cast_fp16)[name = tensor("linear_0_cast_fp16")]; tensor var_192_begin_0 = const()[name = tensor("op_192_begin_0"), val = tensor([0, 2, 0])]; tensor var_192_end_0 = const()[name = tensor("op_192_end_0"), val = tensor([1, 5, 512])]; tensor var_192_end_mask_0 = const()[name = tensor("op_192_end_mask_0"), val = tensor([true, true, true])]; tensor var_192_cast_fp16 = slice_by_index(begin = var_192_begin_0, end = var_192_end_0, end_mask = var_192_end_mask_0, x = linear_0_cast_fp16)[name = tensor("op_192_cast_fp16")]; tensor var_194 = const()[name = tensor("op_194"), val = tensor(2)]; tensor lengths_cast_fp16_to_int32 = cast(dtype = cast_9_dtype_0, x = lengths_cast_fp16)[name = tensor("cast_192")]; tensor var_195 = sub(x = lengths_cast_fp16_to_int32, y = var_194)[name = tensor("op_195")]; tensor var_195_promoted_to_fp16_dtype_0 = const()[name = tensor("op_195_promoted_to_fp16_dtype_0"), val = tensor("fp16")]; tensor var_60_promoted_to_fp16 = const()[name = tensor("op_60_promoted_to_fp16"), val = tensor(0x0p+0)]; tensor const_5_to_fp16 = const()[name = tensor("const_5_to_fp16"), val = tensor(inf)]; tensor var_195_to_fp16 = cast(dtype = var_195_promoted_to_fp16_dtype_0, x = var_195)[name = tensor("cast_191")]; tensor clip_0_cast_fp16 = clip(alpha = var_60_promoted_to_fp16, beta = const_5_to_fp16, x = var_195_to_fp16)[name = tensor("clip_0_cast_fp16")]; tensor cache_keep_size = const()[name = tensor("cache_keep_size"), val = tensor([1])]; tensor var_211_promoted_to_fp16 = const()[name = tensor("op_211_promoted_to_fp16"), val = tensor(0x1.18p+6)]; tensor padding_length_cast_fp16 = add(x = clip_0_cast_fp16, y = var_211_promoted_to_fp16)[name = tensor("padding_length_cast_fp16")]; tensor const_7 = const()[name = tensor("const_7"), val = tensor(-1)]; tensor var_213 = mul(x = cache_last_channel_len, y = const_7)[name = tensor("op_213")]; tensor var_214 = const()[name = tensor("op_214"), val = tensor(70)]; tensor offset = add(x = var_213, y = var_214)[name = tensor("offset")]; tensor var_254_axes_0 = const()[name = tensor("op_254_axes_0"), val = tensor([-1])]; tensor var_254_cast_fp16 = expand_dims(axes = var_254_axes_0, x = padding_length_cast_fp16)[name = tensor("op_254_cast_fp16")]; tensor var_253_promoted_to_fp16 = const()[name = tensor("op_253_promoted_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4736832)))]; tensor pad_mask_1_cast_fp16 = less(x = var_253_promoted_to_fp16, y = var_254_cast_fp16)[name = tensor("pad_mask_1_cast_fp16")]; tensor expand_dims_1 = const()[name = tensor("expand_dims_1"), val = tensor([[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72]])]; tensor var_260_axes_0 = const()[name = tensor("op_260_axes_0"), val = tensor([-1])]; tensor var_260 = expand_dims(axes = var_260_axes_0, x = offset)[name = tensor("op_260")]; tensor pad_mask_off = greater_equal(x = expand_dims_1, y = var_260)[name = tensor("pad_mask_off")]; tensor pad_mask_3 = logical_and(x = pad_mask_off, y = pad_mask_1_cast_fp16)[name = tensor("pad_mask_3")]; tensor var_263_axes_0 = const()[name = tensor("op_263_axes_0"), val = tensor([1])]; tensor var_263 = expand_dims(axes = var_263_axes_0, x = pad_mask_3)[name = tensor("op_263")]; tensor var_264 = const()[name = tensor("op_264"), val = tensor([1, 73, 1])]; tensor pad_mask_for_att_mask_1 = tile(reps = var_264, x = var_263)[name = tensor("pad_mask_for_att_mask_1")]; tensor var_266_perm_0 = const()[name = tensor("op_266_perm_0"), val = tensor([0, 2, 1])]; tensor var_266 = transpose(perm = var_266_perm_0, x = pad_mask_for_att_mask_1)[name = tensor("transpose_239")]; tensor pad_mask_for_att_mask = logical_and(x = pad_mask_for_att_mask_1, y = var_266)[name = tensor("pad_mask_for_att_mask")]; tensor const_15 = const()[name = tensor("const_15"), val = tensor([[[true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false, false, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false], [true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, false], [false, false, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true, true]]])]; tensor att_mask_9 = logical_and(x = pad_mask_for_att_mask, y = const_15)[name = tensor("att_mask_9")]; tensor att_mask = logical_not(x = att_mask_9)[name = tensor("att_mask")]; tensor pad_mask_5 = logical_not(x = pad_mask_3)[name = tensor("pad_mask_5")]; tensor pad_mask_begin_0 = const()[name = tensor("pad_mask_begin_0"), val = tensor([0, 70])]; tensor pad_mask_end_0 = const()[name = tensor("pad_mask_end_0"), val = tensor([1, 73])]; tensor pad_mask_end_mask_0 = const()[name = tensor("pad_mask_end_mask_0"), val = tensor([true, true])]; tensor pad_mask = slice_by_index(begin = pad_mask_begin_0, end = pad_mask_end_0, end_mask = pad_mask_end_mask_0, x = pad_mask_5)[name = tensor("pad_mask")]; tensor mask_1_begin_0 = const()[name = tensor("mask_1_begin_0"), val = tensor([0, 70, 0])]; tensor mask_1_end_0 = const()[name = tensor("mask_1_end_0"), val = tensor([1, 73, 73])]; tensor mask_1_end_mask_0 = const()[name = tensor("mask_1_end_mask_0"), val = tensor([true, true, true])]; tensor mask_1 = slice_by_index(begin = mask_1_begin_0, end = mask_1_end_0, end_mask = mask_1_end_mask_0, x = att_mask)[name = tensor("mask_1")]; tensor cache_1_begin_0 = const()[name = tensor("cache_1_begin_0"), val = tensor([0, 0, 0, 0])]; tensor cache_1_end_0 = const()[name = tensor("cache_1_end_0"), val = tensor([1, 1, 70, 512])]; tensor cache_1_end_mask_0 = const()[name = tensor("cache_1_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_1_squeeze_mask_0 = const()[name = tensor("cache_1_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_last_channel_to_fp16_dtype_0 = const()[name = tensor("cache_last_channel_to_fp16_dtype_0"), val = tensor("fp16")]; tensor cache_last_channel_to_fp16 = cast(dtype = cache_last_channel_to_fp16_dtype_0, x = cache_last_channel)[name = tensor("cast_190")]; tensor cache_1_cast_fp16 = slice_by_index(begin = cache_1_begin_0, end = cache_1_end_0, end_mask = cache_1_end_mask_0, squeeze_mask = cache_1_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_1_cast_fp16")]; tensor cache_3_begin_0 = const()[name = tensor("cache_3_begin_0"), val = tensor([0, 0, 0, 0])]; tensor cache_3_end_0 = const()[name = tensor("cache_3_end_0"), val = tensor([1, 1, 512, 8])]; tensor cache_3_end_mask_0 = const()[name = tensor("cache_3_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_3_squeeze_mask_0 = const()[name = tensor("cache_3_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_last_time_to_fp16_dtype_0 = const()[name = tensor("cache_last_time_to_fp16_dtype_0"), val = tensor("fp16")]; tensor cache_last_time_to_fp16 = cast(dtype = cache_last_time_to_fp16_dtype_0, x = cache_last_time)[name = tensor("cast_189")]; tensor cache_3_cast_fp16 = slice_by_index(begin = cache_3_begin_0, end = cache_3_end_0, end_mask = cache_3_end_mask_0, squeeze_mask = cache_3_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_3_cast_fp16")]; tensor input_27_axes_0 = const()[name = tensor("input_27_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_0_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4737088)))]; tensor encoder_layers_0_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_0_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4738176)))]; tensor var_38_to_fp16 = const()[name = tensor("op_38_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_27_cast_fp16 = layer_norm(axes = input_27_axes_0, beta = encoder_layers_0_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_0_norm_feed_forward1_weight_to_fp16, x = var_192_cast_fp16)[name = tensor("input_27_cast_fp16")]; tensor encoder_layers_0_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_0_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4739264)))]; tensor linear_1_bias_0_to_fp16 = const()[name = tensor("linear_1_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6836480)))]; tensor linear_1_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_0_feed_forward1_linear1_weight_to_fp16, x = input_27_cast_fp16)[name = tensor("linear_1_cast_fp16")]; tensor input_31_cast_fp16 = silu(x = linear_1_cast_fp16)[name = tensor("input_31_cast_fp16")]; tensor encoder_layers_0_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_0_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6840640)))]; tensor linear_2_bias_0_to_fp16 = const()[name = tensor("linear_2_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8937856)))]; tensor linear_2_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_0_feed_forward1_linear2_weight_to_fp16, x = input_31_cast_fp16)[name = tensor("linear_2_cast_fp16")]; tensor var_303_to_fp16 = const()[name = tensor("op_303_to_fp16"), val = tensor(0x1p-1)]; tensor var_304_cast_fp16 = mul(x = linear_2_cast_fp16, y = var_303_to_fp16)[name = tensor("op_304_cast_fp16")]; tensor input_37_cast_fp16 = add(x = var_192_cast_fp16, y = var_304_cast_fp16)[name = tensor("input_37_cast_fp16")]; tensor key_1_axes_0 = const()[name = tensor("key_1_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_0_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8938944)))]; tensor encoder_layers_0_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_0_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8940032)))]; tensor key_1_cast_fp16 = layer_norm(axes = key_1_axes_0, beta = encoder_layers_0_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_0_norm_self_att_weight_to_fp16, x = input_37_cast_fp16)[name = tensor("key_1_cast_fp16")]; tensor input_39_interleave_0 = const()[name = tensor("input_39_interleave_0"), val = tensor(false)]; tensor input_39_cast_fp16 = concat(axis = var_64, interleave = input_39_interleave_0, values = (cache_1_cast_fp16, key_1_cast_fp16))[name = tensor("input_39_cast_fp16")]; tensor var_326_begin_0 = const()[name = tensor("op_326_begin_0"), val = tensor([0, 1, 0])]; tensor var_326_end_0 = const()[name = tensor("op_326_end_0"), val = tensor([1, 70, 512])]; tensor var_326_end_mask_0 = const()[name = tensor("op_326_end_mask_0"), val = tensor([true, true, true])]; tensor var_326_cast_fp16 = slice_by_index(begin = var_326_begin_0, end = var_326_end_0, end_mask = var_326_end_mask_0, x = cache_1_cast_fp16)[name = tensor("op_326_cast_fp16")]; tensor var_329_begin_0 = const()[name = tensor("op_329_begin_0"), val = tensor([0, 0, 0])]; tensor var_329_end_0 = const()[name = tensor("op_329_end_0"), val = tensor([1, 1, 512])]; tensor var_329_end_mask_0 = const()[name = tensor("op_329_end_mask_0"), val = tensor([true, false, true])]; tensor var_329_cast_fp16 = slice_by_index(begin = var_329_begin_0, end = var_329_end_0, end_mask = var_329_end_mask_0, x = key_1_cast_fp16)[name = tensor("op_329_cast_fp16")]; tensor var_332_interleave_0 = const()[name = tensor("op_332_interleave_0"), val = tensor(false)]; tensor var_332_cast_fp16 = concat(axis = var_64, interleave = var_332_interleave_0, values = (var_326_cast_fp16, var_329_cast_fp16))[name = tensor("op_332_cast_fp16")]; tensor encoder_layers_0_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8941120)))]; tensor linear_3_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_0_self_attn_linear_q_weight_to_fp16, x = key_1_cast_fp16)[name = tensor("linear_3_cast_fp16")]; tensor var_336 = const()[name = tensor("op_336"), val = tensor([1, -1, 8, 64])]; tensor q_1_cast_fp16 = reshape(shape = var_336, x = linear_3_cast_fp16)[name = tensor("q_1_cast_fp16")]; tensor encoder_layers_0_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9465472)))]; tensor linear_4_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_0_self_attn_linear_k_weight_to_fp16, x = input_39_cast_fp16)[name = tensor("linear_4_cast_fp16")]; tensor var_340 = const()[name = tensor("op_340"), val = tensor([1, -1, 8, 64])]; tensor k_1_cast_fp16 = reshape(shape = var_340, x = linear_4_cast_fp16)[name = tensor("k_1_cast_fp16")]; tensor encoder_layers_0_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9989824)))]; tensor linear_5_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_0_self_attn_linear_v_weight_to_fp16, x = input_39_cast_fp16)[name = tensor("linear_5_cast_fp16")]; tensor var_344 = const()[name = tensor("op_344"), val = tensor([1, -1, 8, 64])]; tensor v_1_cast_fp16 = reshape(shape = var_344, x = linear_5_cast_fp16)[name = tensor("v_1_cast_fp16")]; tensor value_3_perm_0 = const()[name = tensor("value_3_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_0_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10514176)))]; tensor var_356_cast_fp16 = add(x = q_1_cast_fp16, y = encoder_layers_0_self_attn_pos_bias_u_to_fp16)[name = tensor("op_356_cast_fp16")]; tensor encoder_layers_0_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10515264)))]; tensor var_358_cast_fp16 = add(x = q_1_cast_fp16, y = encoder_layers_0_self_attn_pos_bias_v_to_fp16)[name = tensor("op_358_cast_fp16")]; tensor q_with_bias_v_1_perm_0 = const()[name = tensor("q_with_bias_v_1_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_7_transpose_x_0 = const()[name = tensor("x_7_transpose_x_0"), val = tensor(false)]; tensor x_7_transpose_y_0 = const()[name = tensor("x_7_transpose_y_0"), val = tensor(false)]; tensor var_360_to_fp16 = const()[name = tensor("op_360_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10516352)))]; tensor q_with_bias_v_1_cast_fp16 = transpose(perm = q_with_bias_v_1_perm_0, x = var_358_cast_fp16)[name = tensor("transpose_237")]; tensor x_7_cast_fp16 = matmul(transpose_x = x_7_transpose_x_0, transpose_y = x_7_transpose_y_0, x = q_with_bias_v_1_cast_fp16, y = var_360_to_fp16)[name = tensor("x_7_cast_fp16")]; tensor x_9_pad_0 = const()[name = tensor("x_9_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_9_mode_0 = const()[name = tensor("x_9_mode_0"), val = tensor("constant")]; tensor const_23_to_fp16 = const()[name = tensor("const_23_to_fp16"), val = tensor(0x0p+0)]; tensor x_9_cast_fp16 = pad(constant_val = const_23_to_fp16, mode = x_9_mode_0, pad = x_9_pad_0, x = x_7_cast_fp16)[name = tensor("x_9_cast_fp16")]; tensor var_368 = const()[name = tensor("op_368"), val = tensor([1, 8, -1, 3])]; tensor x_11_cast_fp16 = reshape(shape = var_368, x = x_9_cast_fp16)[name = tensor("x_11_cast_fp16")]; tensor var_372_begin_0 = const()[name = tensor("op_372_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_372_end_0 = const()[name = tensor("op_372_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_372_end_mask_0 = const()[name = tensor("op_372_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_372_cast_fp16 = slice_by_index(begin = var_372_begin_0, end = var_372_end_0, end_mask = var_372_end_mask_0, x = x_11_cast_fp16)[name = tensor("op_372_cast_fp16")]; tensor var_373 = const()[name = tensor("op_373"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_1_cast_fp16 = reshape(shape = var_373, x = var_372_cast_fp16)[name = tensor("matrix_bd_1_cast_fp16")]; tensor matrix_ac_1_transpose_x_0 = const()[name = tensor("matrix_ac_1_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_1_transpose_y_0 = const()[name = tensor("matrix_ac_1_transpose_y_0"), val = tensor(false)]; tensor transpose_51_perm_0 = const()[name = tensor("transpose_51_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_52_perm_0 = const()[name = tensor("transpose_52_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_52 = transpose(perm = transpose_52_perm_0, x = k_1_cast_fp16)[name = tensor("transpose_235")]; tensor transpose_51 = transpose(perm = transpose_51_perm_0, x = var_356_cast_fp16)[name = tensor("transpose_236")]; tensor matrix_ac_1_cast_fp16 = matmul(transpose_x = matrix_ac_1_transpose_x_0, transpose_y = matrix_ac_1_transpose_y_0, x = transpose_51, y = transpose_52)[name = tensor("matrix_ac_1_cast_fp16")]; tensor matrix_bd_3_begin_0 = const()[name = tensor("matrix_bd_3_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_3_end_0 = const()[name = tensor("matrix_bd_3_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_3_end_mask_0 = const()[name = tensor("matrix_bd_3_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_3_cast_fp16 = slice_by_index(begin = matrix_bd_3_begin_0, end = matrix_bd_3_end_0, end_mask = matrix_bd_3_end_mask_0, x = matrix_bd_1_cast_fp16)[name = tensor("matrix_bd_3_cast_fp16")]; tensor var_382_cast_fp16 = add(x = matrix_ac_1_cast_fp16, y = matrix_bd_3_cast_fp16)[name = tensor("op_382_cast_fp16")]; tensor _inversed_scores_1_y_0_to_fp16 = const()[name = tensor("_inversed_scores_1_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_1_cast_fp16 = mul(x = var_382_cast_fp16, y = _inversed_scores_1_y_0_to_fp16)[name = tensor("_inversed_scores_1_cast_fp16")]; tensor mask_3_axes_0 = const()[name = tensor("mask_3_axes_0"), val = tensor([1])]; tensor mask_3 = expand_dims(axes = mask_3_axes_0, x = mask_1)[name = tensor("mask_3")]; tensor var_41_to_fp16 = const()[name = tensor("op_41_to_fp16"), val = tensor(-0x1.388p+13)]; tensor scores_3_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_1_cast_fp16, cond = mask_3)[name = tensor("scores_3_cast_fp16")]; tensor var_388_cast_fp16 = softmax(axis = var_62, x = scores_3_cast_fp16)[name = tensor("op_388_cast_fp16")]; tensor var_40_to_fp16 = const()[name = tensor("op_40_to_fp16"), val = tensor(0x0p+0)]; tensor input_41_cast_fp16 = select(a = var_40_to_fp16, b = var_388_cast_fp16, cond = mask_3)[name = tensor("input_41_cast_fp16")]; tensor x_13_transpose_x_0 = const()[name = tensor("x_13_transpose_x_0"), val = tensor(false)]; tensor x_13_transpose_y_0 = const()[name = tensor("x_13_transpose_y_0"), val = tensor(false)]; tensor value_3_cast_fp16 = transpose(perm = value_3_perm_0, x = v_1_cast_fp16)[name = tensor("transpose_238")]; tensor x_13_cast_fp16 = matmul(transpose_x = x_13_transpose_x_0, transpose_y = x_13_transpose_y_0, x = input_41_cast_fp16, y = value_3_cast_fp16)[name = tensor("x_13_cast_fp16")]; tensor var_392_perm_0 = const()[name = tensor("op_392_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_393 = const()[name = tensor("op_393"), val = tensor([1, -1, 512])]; tensor var_392_cast_fp16 = transpose(perm = var_392_perm_0, x = x_13_cast_fp16)[name = tensor("transpose_234")]; tensor input_43_cast_fp16 = reshape(shape = var_393, x = var_392_cast_fp16)[name = tensor("input_43_cast_fp16")]; tensor encoder_layers_0_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_0_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10664896)))]; tensor linear_7_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_0_self_attn_linear_out_weight_to_fp16, x = input_43_cast_fp16)[name = tensor("linear_7_cast_fp16")]; tensor input_47_cast_fp16 = add(x = input_37_cast_fp16, y = linear_7_cast_fp16)[name = tensor("input_47_cast_fp16")]; tensor x_17_axes_0 = const()[name = tensor("x_17_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_0_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11189248)))]; tensor encoder_layers_0_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_0_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11190336)))]; tensor x_17_cast_fp16 = layer_norm(axes = x_17_axes_0, beta = encoder_layers_0_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_0_norm_conv_weight_to_fp16, x = input_47_cast_fp16)[name = tensor("x_17_cast_fp16")]; tensor input_49_perm_0 = const()[name = tensor("input_49_perm_0"), val = tensor([0, 2, 1])]; tensor input_51_pad_type_0 = const()[name = tensor("input_51_pad_type_0"), val = tensor("valid")]; tensor input_51_strides_0 = const()[name = tensor("input_51_strides_0"), val = tensor([1])]; tensor input_51_pad_0 = const()[name = tensor("input_51_pad_0"), val = tensor([0, 0])]; tensor input_51_dilations_0 = const()[name = tensor("input_51_dilations_0"), val = tensor([1])]; tensor input_51_groups_0 = const()[name = tensor("input_51_groups_0"), val = tensor(1)]; tensor encoder_layers_0_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_0_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11191424)))]; tensor input_49_cast_fp16 = transpose(perm = input_49_perm_0, x = x_17_cast_fp16)[name = tensor("transpose_233")]; tensor input_51_cast_fp16 = conv(dilations = input_51_dilations_0, groups = input_51_groups_0, pad = input_51_pad_0, pad_type = input_51_pad_type_0, strides = input_51_strides_0, weight = encoder_layers_0_conv_pointwise_conv1_weight_to_fp16, x = input_49_cast_fp16)[name = tensor("input_51_cast_fp16")]; tensor x_19_split_num_splits_0 = const()[name = tensor("x_19_split_num_splits_0"), val = tensor(2)]; tensor x_19_split_axis_0 = const()[name = tensor("x_19_split_axis_0"), val = tensor(1)]; tensor x_19_split_cast_fp16_0, tensor x_19_split_cast_fp16_1 = split(axis = x_19_split_axis_0, num_splits = x_19_split_num_splits_0, x = input_51_cast_fp16)[name = tensor("x_19_split_cast_fp16")]; tensor x_19_split_1_sigmoid_cast_fp16 = sigmoid(x = x_19_split_cast_fp16_1)[name = tensor("x_19_split_1_sigmoid_cast_fp16")]; tensor x_19_cast_fp16 = mul(x = x_19_split_cast_fp16_0, y = x_19_split_1_sigmoid_cast_fp16)[name = tensor("x_19_cast_fp16")]; tensor var_418_axes_0 = const()[name = tensor("op_418_axes_0"), val = tensor([1])]; tensor var_418 = expand_dims(axes = var_418_axes_0, x = pad_mask)[name = tensor("op_418")]; tensor input_53_cast_fp16 = select(a = var_40_to_fp16, b = x_19_cast_fp16, cond = var_418)[name = tensor("input_53_cast_fp16")]; tensor new_x_3_interleave_0 = const()[name = tensor("new_x_3_interleave_0"), val = tensor(false)]; tensor new_x_3_cast_fp16 = concat(axis = var_62, interleave = new_x_3_interleave_0, values = (cache_3_cast_fp16, input_53_cast_fp16))[name = tensor("new_x_3_cast_fp16")]; tensor next_cache_1_begin_0 = const()[name = tensor("next_cache_1_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_1_end_0 = const()[name = tensor("next_cache_1_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_1_end_mask_0 = const()[name = tensor("next_cache_1_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_1_cast_fp16 = slice_by_index(begin = next_cache_1_begin_0, end = next_cache_1_end_0, end_mask = next_cache_1_end_mask_0, x = new_x_3_cast_fp16)[name = tensor("next_cache_1_cast_fp16")]; tensor var_434_begin_0 = const()[name = tensor("op_434_begin_0"), val = tensor([0, 0, 1])]; tensor var_434_end_0 = const()[name = tensor("op_434_end_0"), val = tensor([1, 512, 9])]; tensor var_434_end_mask_0 = const()[name = tensor("op_434_end_mask_0"), val = tensor([true, true, true])]; tensor var_434_cast_fp16 = slice_by_index(begin = var_434_begin_0, end = var_434_end_0, end_mask = var_434_end_mask_0, x = next_cache_1_cast_fp16)[name = tensor("op_434_cast_fp16")]; tensor x_21_pad_type_0 = const()[name = tensor("x_21_pad_type_0"), val = tensor("valid")]; tensor x_21_groups_0 = const()[name = tensor("x_21_groups_0"), val = tensor(512)]; tensor x_21_strides_0 = const()[name = tensor("x_21_strides_0"), val = tensor([1])]; tensor x_21_pad_0 = const()[name = tensor("x_21_pad_0"), val = tensor([0, 0])]; tensor x_21_dilations_0 = const()[name = tensor("x_21_dilations_0"), val = tensor([1])]; tensor encoder_layers_0_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_0_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12240064)))]; tensor x_21_cast_fp16 = conv(dilations = x_21_dilations_0, groups = x_21_groups_0, pad = x_21_pad_0, pad_type = x_21_pad_type_0, strides = x_21_strides_0, weight = encoder_layers_0_conv_depthwise_conv_weight_to_fp16, x = new_x_3_cast_fp16)[name = tensor("x_21_cast_fp16")]; tensor input_55_perm_0 = const()[name = tensor("input_55_perm_0"), val = tensor([0, 2, 1])]; tensor x_23_axes_0 = const()[name = tensor("x_23_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_0_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12249344)))]; tensor encoder_layers_0_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_0_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12250432)))]; tensor input_55_cast_fp16 = transpose(perm = input_55_perm_0, x = x_21_cast_fp16)[name = tensor("transpose_232")]; tensor x_23_cast_fp16 = layer_norm(axes = x_23_axes_0, beta = encoder_layers_0_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_0_conv_batch_norm_weight_to_fp16, x = input_55_cast_fp16)[name = tensor("x_23_cast_fp16")]; tensor input_57_perm_0 = const()[name = tensor("input_57_perm_0"), val = tensor([0, 2, 1])]; tensor input_57_cast_fp16 = transpose(perm = input_57_perm_0, x = x_23_cast_fp16)[name = tensor("transpose_231")]; tensor input_59_cast_fp16 = silu(x = input_57_cast_fp16)[name = tensor("input_59_cast_fp16")]; tensor x_25_pad_type_0 = const()[name = tensor("x_25_pad_type_0"), val = tensor("valid")]; tensor x_25_strides_0 = const()[name = tensor("x_25_strides_0"), val = tensor([1])]; tensor x_25_pad_0 = const()[name = tensor("x_25_pad_0"), val = tensor([0, 0])]; tensor x_25_dilations_0 = const()[name = tensor("x_25_dilations_0"), val = tensor([1])]; tensor x_25_groups_0 = const()[name = tensor("x_25_groups_0"), val = tensor(1)]; tensor encoder_layers_0_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_0_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12251520)))]; tensor x_25_cast_fp16 = conv(dilations = x_25_dilations_0, groups = x_25_groups_0, pad = x_25_pad_0, pad_type = x_25_pad_type_0, strides = x_25_strides_0, weight = encoder_layers_0_conv_pointwise_conv2_weight_to_fp16, x = input_59_cast_fp16)[name = tensor("x_25_cast_fp16")]; tensor input_61_perm_0 = const()[name = tensor("input_61_perm_0"), val = tensor([0, 2, 1])]; tensor input_61_cast_fp16 = transpose(perm = input_61_perm_0, x = x_25_cast_fp16)[name = tensor("transpose_230")]; tensor input_63_cast_fp16 = add(x = input_47_cast_fp16, y = input_61_cast_fp16)[name = tensor("input_63_cast_fp16")]; tensor input_65_axes_0 = const()[name = tensor("input_65_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_0_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12775872)))]; tensor encoder_layers_0_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_0_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12776960)))]; tensor input_65_cast_fp16 = layer_norm(axes = input_65_axes_0, beta = encoder_layers_0_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_0_norm_feed_forward2_weight_to_fp16, x = input_63_cast_fp16)[name = tensor("input_65_cast_fp16")]; tensor encoder_layers_0_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_0_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12778048)))]; tensor linear_8_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_0_feed_forward2_linear1_weight_to_fp16, x = input_65_cast_fp16)[name = tensor("linear_8_cast_fp16")]; tensor input_69_cast_fp16 = silu(x = linear_8_cast_fp16)[name = tensor("input_69_cast_fp16")]; tensor encoder_layers_0_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_0_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14875264)))]; tensor linear_9_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_0_feed_forward2_linear2_weight_to_fp16, x = input_69_cast_fp16)[name = tensor("linear_9_cast_fp16")]; tensor var_475_to_fp16 = const()[name = tensor("op_475_to_fp16"), val = tensor(0x1p-1)]; tensor var_476_cast_fp16 = mul(x = linear_9_cast_fp16, y = var_475_to_fp16)[name = tensor("op_476_cast_fp16")]; tensor input_75_cast_fp16 = add(x = input_63_cast_fp16, y = var_476_cast_fp16)[name = tensor("input_75_cast_fp16")]; tensor input_77_axes_0 = const()[name = tensor("input_77_axes_0"), val = tensor([-1])]; tensor encoder_layers_0_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_0_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16972480)))]; tensor encoder_layers_0_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_0_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16973568)))]; tensor input_77_cast_fp16 = layer_norm(axes = input_77_axes_0, beta = encoder_layers_0_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_0_norm_out_weight_to_fp16, x = input_75_cast_fp16)[name = tensor("input_77_cast_fp16")]; tensor cache_5_begin_0 = const()[name = tensor("cache_5_begin_0"), val = tensor([1, 0, 0, 0])]; tensor cache_5_end_0 = const()[name = tensor("cache_5_end_0"), val = tensor([2, 1, 70, 512])]; tensor cache_5_end_mask_0 = const()[name = tensor("cache_5_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_5_squeeze_mask_0 = const()[name = tensor("cache_5_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_5_cast_fp16 = slice_by_index(begin = cache_5_begin_0, end = cache_5_end_0, end_mask = cache_5_end_mask_0, squeeze_mask = cache_5_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_5_cast_fp16")]; tensor cache_7_begin_0 = const()[name = tensor("cache_7_begin_0"), val = tensor([1, 0, 0, 0])]; tensor cache_7_end_0 = const()[name = tensor("cache_7_end_0"), val = tensor([2, 1, 512, 8])]; tensor cache_7_end_mask_0 = const()[name = tensor("cache_7_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_7_squeeze_mask_0 = const()[name = tensor("cache_7_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_7_cast_fp16 = slice_by_index(begin = cache_7_begin_0, end = cache_7_end_0, end_mask = cache_7_end_mask_0, squeeze_mask = cache_7_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_7_cast_fp16")]; tensor input_79_axes_0 = const()[name = tensor("input_79_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_1_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16974656)))]; tensor encoder_layers_1_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_1_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16975744)))]; tensor input_79_cast_fp16 = layer_norm(axes = input_79_axes_0, beta = encoder_layers_1_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_1_norm_feed_forward1_weight_to_fp16, x = input_77_cast_fp16)[name = tensor("input_79_cast_fp16")]; tensor encoder_layers_1_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_1_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16976832)))]; tensor linear_10_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_1_feed_forward1_linear1_weight_to_fp16, x = input_79_cast_fp16)[name = tensor("linear_10_cast_fp16")]; tensor input_83_cast_fp16 = silu(x = linear_10_cast_fp16)[name = tensor("input_83_cast_fp16")]; tensor encoder_layers_1_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_1_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19074048)))]; tensor linear_11_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_1_feed_forward1_linear2_weight_to_fp16, x = input_83_cast_fp16)[name = tensor("linear_11_cast_fp16")]; tensor var_510_to_fp16 = const()[name = tensor("op_510_to_fp16"), val = tensor(0x1p-1)]; tensor var_511_cast_fp16 = mul(x = linear_11_cast_fp16, y = var_510_to_fp16)[name = tensor("op_511_cast_fp16")]; tensor input_89_cast_fp16 = add(x = input_77_cast_fp16, y = var_511_cast_fp16)[name = tensor("input_89_cast_fp16")]; tensor key_3_axes_0 = const()[name = tensor("key_3_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_1_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21171264)))]; tensor encoder_layers_1_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_1_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21172352)))]; tensor key_3_cast_fp16 = layer_norm(axes = key_3_axes_0, beta = encoder_layers_1_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_1_norm_self_att_weight_to_fp16, x = input_89_cast_fp16)[name = tensor("key_3_cast_fp16")]; tensor input_91_interleave_0 = const()[name = tensor("input_91_interleave_0"), val = tensor(false)]; tensor input_91_cast_fp16 = concat(axis = var_64, interleave = input_91_interleave_0, values = (cache_5_cast_fp16, key_3_cast_fp16))[name = tensor("input_91_cast_fp16")]; tensor var_533_begin_0 = const()[name = tensor("op_533_begin_0"), val = tensor([0, 1, 0])]; tensor var_533_end_0 = const()[name = tensor("op_533_end_0"), val = tensor([1, 70, 512])]; tensor var_533_end_mask_0 = const()[name = tensor("op_533_end_mask_0"), val = tensor([true, true, true])]; tensor var_533_cast_fp16 = slice_by_index(begin = var_533_begin_0, end = var_533_end_0, end_mask = var_533_end_mask_0, x = cache_5_cast_fp16)[name = tensor("op_533_cast_fp16")]; tensor var_536_begin_0 = const()[name = tensor("op_536_begin_0"), val = tensor([0, 0, 0])]; tensor var_536_end_0 = const()[name = tensor("op_536_end_0"), val = tensor([1, 1, 512])]; tensor var_536_end_mask_0 = const()[name = tensor("op_536_end_mask_0"), val = tensor([true, false, true])]; tensor var_536_cast_fp16 = slice_by_index(begin = var_536_begin_0, end = var_536_end_0, end_mask = var_536_end_mask_0, x = key_3_cast_fp16)[name = tensor("op_536_cast_fp16")]; tensor var_539_interleave_0 = const()[name = tensor("op_539_interleave_0"), val = tensor(false)]; tensor var_539_cast_fp16 = concat(axis = var_64, interleave = var_539_interleave_0, values = (var_533_cast_fp16, var_536_cast_fp16))[name = tensor("op_539_cast_fp16")]; tensor encoder_layers_1_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21173440)))]; tensor linear_12_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_1_self_attn_linear_q_weight_to_fp16, x = key_3_cast_fp16)[name = tensor("linear_12_cast_fp16")]; tensor var_543 = const()[name = tensor("op_543"), val = tensor([1, -1, 8, 64])]; tensor q_7_cast_fp16 = reshape(shape = var_543, x = linear_12_cast_fp16)[name = tensor("q_7_cast_fp16")]; tensor encoder_layers_1_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21697792)))]; tensor linear_13_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_1_self_attn_linear_k_weight_to_fp16, x = input_91_cast_fp16)[name = tensor("linear_13_cast_fp16")]; tensor var_547 = const()[name = tensor("op_547"), val = tensor([1, -1, 8, 64])]; tensor k_5_cast_fp16 = reshape(shape = var_547, x = linear_13_cast_fp16)[name = tensor("k_5_cast_fp16")]; tensor encoder_layers_1_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22222144)))]; tensor linear_14_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_1_self_attn_linear_v_weight_to_fp16, x = input_91_cast_fp16)[name = tensor("linear_14_cast_fp16")]; tensor var_551 = const()[name = tensor("op_551"), val = tensor([1, -1, 8, 64])]; tensor v_3_cast_fp16 = reshape(shape = var_551, x = linear_14_cast_fp16)[name = tensor("v_3_cast_fp16")]; tensor value_5_perm_0 = const()[name = tensor("value_5_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_1_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22746496)))]; tensor var_563_cast_fp16 = add(x = q_7_cast_fp16, y = encoder_layers_1_self_attn_pos_bias_u_to_fp16)[name = tensor("op_563_cast_fp16")]; tensor encoder_layers_1_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22747584)))]; tensor var_565_cast_fp16 = add(x = q_7_cast_fp16, y = encoder_layers_1_self_attn_pos_bias_v_to_fp16)[name = tensor("op_565_cast_fp16")]; tensor q_with_bias_v_3_perm_0 = const()[name = tensor("q_with_bias_v_3_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_33_transpose_x_0 = const()[name = tensor("x_33_transpose_x_0"), val = tensor(false)]; tensor x_33_transpose_y_0 = const()[name = tensor("x_33_transpose_y_0"), val = tensor(false)]; tensor var_567_to_fp16 = const()[name = tensor("op_567_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22748672)))]; tensor q_with_bias_v_3_cast_fp16 = transpose(perm = q_with_bias_v_3_perm_0, x = var_565_cast_fp16)[name = tensor("transpose_228")]; tensor x_33_cast_fp16 = matmul(transpose_x = x_33_transpose_x_0, transpose_y = x_33_transpose_y_0, x = q_with_bias_v_3_cast_fp16, y = var_567_to_fp16)[name = tensor("x_33_cast_fp16")]; tensor x_35_pad_0 = const()[name = tensor("x_35_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_35_mode_0 = const()[name = tensor("x_35_mode_0"), val = tensor("constant")]; tensor const_36_to_fp16 = const()[name = tensor("const_36_to_fp16"), val = tensor(0x0p+0)]; tensor x_35_cast_fp16 = pad(constant_val = const_36_to_fp16, mode = x_35_mode_0, pad = x_35_pad_0, x = x_33_cast_fp16)[name = tensor("x_35_cast_fp16")]; tensor var_575 = const()[name = tensor("op_575"), val = tensor([1, 8, -1, 3])]; tensor x_37_cast_fp16 = reshape(shape = var_575, x = x_35_cast_fp16)[name = tensor("x_37_cast_fp16")]; tensor var_579_begin_0 = const()[name = tensor("op_579_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_579_end_0 = const()[name = tensor("op_579_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_579_end_mask_0 = const()[name = tensor("op_579_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_579_cast_fp16 = slice_by_index(begin = var_579_begin_0, end = var_579_end_0, end_mask = var_579_end_mask_0, x = x_37_cast_fp16)[name = tensor("op_579_cast_fp16")]; tensor var_580 = const()[name = tensor("op_580"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_5_cast_fp16 = reshape(shape = var_580, x = var_579_cast_fp16)[name = tensor("matrix_bd_5_cast_fp16")]; tensor matrix_ac_3_transpose_x_0 = const()[name = tensor("matrix_ac_3_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_3_transpose_y_0 = const()[name = tensor("matrix_ac_3_transpose_y_0"), val = tensor(false)]; tensor transpose_53_perm_0 = const()[name = tensor("transpose_53_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_54_perm_0 = const()[name = tensor("transpose_54_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_54 = transpose(perm = transpose_54_perm_0, x = k_5_cast_fp16)[name = tensor("transpose_226")]; tensor transpose_53 = transpose(perm = transpose_53_perm_0, x = var_563_cast_fp16)[name = tensor("transpose_227")]; tensor matrix_ac_3_cast_fp16 = matmul(transpose_x = matrix_ac_3_transpose_x_0, transpose_y = matrix_ac_3_transpose_y_0, x = transpose_53, y = transpose_54)[name = tensor("matrix_ac_3_cast_fp16")]; tensor matrix_bd_7_begin_0 = const()[name = tensor("matrix_bd_7_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_7_end_0 = const()[name = tensor("matrix_bd_7_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_7_end_mask_0 = const()[name = tensor("matrix_bd_7_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_7_cast_fp16 = slice_by_index(begin = matrix_bd_7_begin_0, end = matrix_bd_7_end_0, end_mask = matrix_bd_7_end_mask_0, x = matrix_bd_5_cast_fp16)[name = tensor("matrix_bd_7_cast_fp16")]; tensor var_589_cast_fp16 = add(x = matrix_ac_3_cast_fp16, y = matrix_bd_7_cast_fp16)[name = tensor("op_589_cast_fp16")]; tensor _inversed_scores_5_y_0_to_fp16 = const()[name = tensor("_inversed_scores_5_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_5_cast_fp16 = mul(x = var_589_cast_fp16, y = _inversed_scores_5_y_0_to_fp16)[name = tensor("_inversed_scores_5_cast_fp16")]; tensor scores_7_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_5_cast_fp16, cond = mask_3)[name = tensor("scores_7_cast_fp16")]; tensor var_595_cast_fp16 = softmax(axis = var_62, x = scores_7_cast_fp16)[name = tensor("op_595_cast_fp16")]; tensor input_93_cast_fp16 = select(a = var_40_to_fp16, b = var_595_cast_fp16, cond = mask_3)[name = tensor("input_93_cast_fp16")]; tensor x_39_transpose_x_0 = const()[name = tensor("x_39_transpose_x_0"), val = tensor(false)]; tensor x_39_transpose_y_0 = const()[name = tensor("x_39_transpose_y_0"), val = tensor(false)]; tensor value_5_cast_fp16 = transpose(perm = value_5_perm_0, x = v_3_cast_fp16)[name = tensor("transpose_229")]; tensor x_39_cast_fp16 = matmul(transpose_x = x_39_transpose_x_0, transpose_y = x_39_transpose_y_0, x = input_93_cast_fp16, y = value_5_cast_fp16)[name = tensor("x_39_cast_fp16")]; tensor var_599_perm_0 = const()[name = tensor("op_599_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_600 = const()[name = tensor("op_600"), val = tensor([1, -1, 512])]; tensor var_599_cast_fp16 = transpose(perm = var_599_perm_0, x = x_39_cast_fp16)[name = tensor("transpose_225")]; tensor input_95_cast_fp16 = reshape(shape = var_600, x = var_599_cast_fp16)[name = tensor("input_95_cast_fp16")]; tensor encoder_layers_1_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_1_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22897216)))]; tensor linear_16_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_1_self_attn_linear_out_weight_to_fp16, x = input_95_cast_fp16)[name = tensor("linear_16_cast_fp16")]; tensor input_99_cast_fp16 = add(x = input_89_cast_fp16, y = linear_16_cast_fp16)[name = tensor("input_99_cast_fp16")]; tensor x_43_axes_0 = const()[name = tensor("x_43_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_1_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23421568)))]; tensor encoder_layers_1_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_1_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23422656)))]; tensor x_43_cast_fp16 = layer_norm(axes = x_43_axes_0, beta = encoder_layers_1_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_1_norm_conv_weight_to_fp16, x = input_99_cast_fp16)[name = tensor("x_43_cast_fp16")]; tensor input_101_perm_0 = const()[name = tensor("input_101_perm_0"), val = tensor([0, 2, 1])]; tensor input_103_pad_type_0 = const()[name = tensor("input_103_pad_type_0"), val = tensor("valid")]; tensor input_103_strides_0 = const()[name = tensor("input_103_strides_0"), val = tensor([1])]; tensor input_103_pad_0 = const()[name = tensor("input_103_pad_0"), val = tensor([0, 0])]; tensor input_103_dilations_0 = const()[name = tensor("input_103_dilations_0"), val = tensor([1])]; tensor input_103_groups_0 = const()[name = tensor("input_103_groups_0"), val = tensor(1)]; tensor encoder_layers_1_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_1_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23423744)))]; tensor input_101_cast_fp16 = transpose(perm = input_101_perm_0, x = x_43_cast_fp16)[name = tensor("transpose_224")]; tensor input_103_cast_fp16 = conv(dilations = input_103_dilations_0, groups = input_103_groups_0, pad = input_103_pad_0, pad_type = input_103_pad_type_0, strides = input_103_strides_0, weight = encoder_layers_1_conv_pointwise_conv1_weight_to_fp16, x = input_101_cast_fp16)[name = tensor("input_103_cast_fp16")]; tensor x_45_split_num_splits_0 = const()[name = tensor("x_45_split_num_splits_0"), val = tensor(2)]; tensor x_45_split_axis_0 = const()[name = tensor("x_45_split_axis_0"), val = tensor(1)]; tensor x_45_split_cast_fp16_0, tensor x_45_split_cast_fp16_1 = split(axis = x_45_split_axis_0, num_splits = x_45_split_num_splits_0, x = input_103_cast_fp16)[name = tensor("x_45_split_cast_fp16")]; tensor x_45_split_1_sigmoid_cast_fp16 = sigmoid(x = x_45_split_cast_fp16_1)[name = tensor("x_45_split_1_sigmoid_cast_fp16")]; tensor x_45_cast_fp16 = mul(x = x_45_split_cast_fp16_0, y = x_45_split_1_sigmoid_cast_fp16)[name = tensor("x_45_cast_fp16")]; tensor input_105_cast_fp16 = select(a = var_40_to_fp16, b = x_45_cast_fp16, cond = var_418)[name = tensor("input_105_cast_fp16")]; tensor new_x_7_interleave_0 = const()[name = tensor("new_x_7_interleave_0"), val = tensor(false)]; tensor new_x_7_cast_fp16 = concat(axis = var_62, interleave = new_x_7_interleave_0, values = (cache_7_cast_fp16, input_105_cast_fp16))[name = tensor("new_x_7_cast_fp16")]; tensor next_cache_3_begin_0 = const()[name = tensor("next_cache_3_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_3_end_0 = const()[name = tensor("next_cache_3_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_3_end_mask_0 = const()[name = tensor("next_cache_3_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_3_cast_fp16 = slice_by_index(begin = next_cache_3_begin_0, end = next_cache_3_end_0, end_mask = next_cache_3_end_mask_0, x = new_x_7_cast_fp16)[name = tensor("next_cache_3_cast_fp16")]; tensor var_641_begin_0 = const()[name = tensor("op_641_begin_0"), val = tensor([0, 0, 1])]; tensor var_641_end_0 = const()[name = tensor("op_641_end_0"), val = tensor([1, 512, 9])]; tensor var_641_end_mask_0 = const()[name = tensor("op_641_end_mask_0"), val = tensor([true, true, true])]; tensor var_641_cast_fp16 = slice_by_index(begin = var_641_begin_0, end = var_641_end_0, end_mask = var_641_end_mask_0, x = next_cache_3_cast_fp16)[name = tensor("op_641_cast_fp16")]; tensor x_47_pad_type_0 = const()[name = tensor("x_47_pad_type_0"), val = tensor("valid")]; tensor x_47_groups_0 = const()[name = tensor("x_47_groups_0"), val = tensor(512)]; tensor x_47_strides_0 = const()[name = tensor("x_47_strides_0"), val = tensor([1])]; tensor x_47_pad_0 = const()[name = tensor("x_47_pad_0"), val = tensor([0, 0])]; tensor x_47_dilations_0 = const()[name = tensor("x_47_dilations_0"), val = tensor([1])]; tensor encoder_layers_1_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_1_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24472384)))]; tensor x_47_cast_fp16 = conv(dilations = x_47_dilations_0, groups = x_47_groups_0, pad = x_47_pad_0, pad_type = x_47_pad_type_0, strides = x_47_strides_0, weight = encoder_layers_1_conv_depthwise_conv_weight_to_fp16, x = new_x_7_cast_fp16)[name = tensor("x_47_cast_fp16")]; tensor input_107_perm_0 = const()[name = tensor("input_107_perm_0"), val = tensor([0, 2, 1])]; tensor x_49_axes_0 = const()[name = tensor("x_49_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_1_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24481664)))]; tensor encoder_layers_1_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_1_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24482752)))]; tensor input_107_cast_fp16 = transpose(perm = input_107_perm_0, x = x_47_cast_fp16)[name = tensor("transpose_223")]; tensor x_49_cast_fp16 = layer_norm(axes = x_49_axes_0, beta = encoder_layers_1_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_1_conv_batch_norm_weight_to_fp16, x = input_107_cast_fp16)[name = tensor("x_49_cast_fp16")]; tensor input_109_perm_0 = const()[name = tensor("input_109_perm_0"), val = tensor([0, 2, 1])]; tensor input_109_cast_fp16 = transpose(perm = input_109_perm_0, x = x_49_cast_fp16)[name = tensor("transpose_222")]; tensor input_111_cast_fp16 = silu(x = input_109_cast_fp16)[name = tensor("input_111_cast_fp16")]; tensor x_51_pad_type_0 = const()[name = tensor("x_51_pad_type_0"), val = tensor("valid")]; tensor x_51_strides_0 = const()[name = tensor("x_51_strides_0"), val = tensor([1])]; tensor x_51_pad_0 = const()[name = tensor("x_51_pad_0"), val = tensor([0, 0])]; tensor x_51_dilations_0 = const()[name = tensor("x_51_dilations_0"), val = tensor([1])]; tensor x_51_groups_0 = const()[name = tensor("x_51_groups_0"), val = tensor(1)]; tensor encoder_layers_1_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_1_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24483840)))]; tensor x_51_cast_fp16 = conv(dilations = x_51_dilations_0, groups = x_51_groups_0, pad = x_51_pad_0, pad_type = x_51_pad_type_0, strides = x_51_strides_0, weight = encoder_layers_1_conv_pointwise_conv2_weight_to_fp16, x = input_111_cast_fp16)[name = tensor("x_51_cast_fp16")]; tensor input_113_perm_0 = const()[name = tensor("input_113_perm_0"), val = tensor([0, 2, 1])]; tensor input_113_cast_fp16 = transpose(perm = input_113_perm_0, x = x_51_cast_fp16)[name = tensor("transpose_221")]; tensor input_115_cast_fp16 = add(x = input_99_cast_fp16, y = input_113_cast_fp16)[name = tensor("input_115_cast_fp16")]; tensor input_117_axes_0 = const()[name = tensor("input_117_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_1_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25008192)))]; tensor encoder_layers_1_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_1_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25009280)))]; tensor input_117_cast_fp16 = layer_norm(axes = input_117_axes_0, beta = encoder_layers_1_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_1_norm_feed_forward2_weight_to_fp16, x = input_115_cast_fp16)[name = tensor("input_117_cast_fp16")]; tensor encoder_layers_1_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_1_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25010368)))]; tensor linear_17_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_1_feed_forward2_linear1_weight_to_fp16, x = input_117_cast_fp16)[name = tensor("linear_17_cast_fp16")]; tensor input_121_cast_fp16 = silu(x = linear_17_cast_fp16)[name = tensor("input_121_cast_fp16")]; tensor encoder_layers_1_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_1_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27107584)))]; tensor linear_18_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_1_feed_forward2_linear2_weight_to_fp16, x = input_121_cast_fp16)[name = tensor("linear_18_cast_fp16")]; tensor var_682_to_fp16 = const()[name = tensor("op_682_to_fp16"), val = tensor(0x1p-1)]; tensor var_683_cast_fp16 = mul(x = linear_18_cast_fp16, y = var_682_to_fp16)[name = tensor("op_683_cast_fp16")]; tensor input_127_cast_fp16 = add(x = input_115_cast_fp16, y = var_683_cast_fp16)[name = tensor("input_127_cast_fp16")]; tensor input_129_axes_0 = const()[name = tensor("input_129_axes_0"), val = tensor([-1])]; tensor encoder_layers_1_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_1_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29204800)))]; tensor encoder_layers_1_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_1_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29205888)))]; tensor input_129_cast_fp16 = layer_norm(axes = input_129_axes_0, beta = encoder_layers_1_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_1_norm_out_weight_to_fp16, x = input_127_cast_fp16)[name = tensor("input_129_cast_fp16")]; tensor cache_9_begin_0 = const()[name = tensor("cache_9_begin_0"), val = tensor([2, 0, 0, 0])]; tensor cache_9_end_0 = const()[name = tensor("cache_9_end_0"), val = tensor([3, 1, 70, 512])]; tensor cache_9_end_mask_0 = const()[name = tensor("cache_9_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_9_squeeze_mask_0 = const()[name = tensor("cache_9_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_9_cast_fp16 = slice_by_index(begin = cache_9_begin_0, end = cache_9_end_0, end_mask = cache_9_end_mask_0, squeeze_mask = cache_9_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_9_cast_fp16")]; tensor cache_11_begin_0 = const()[name = tensor("cache_11_begin_0"), val = tensor([2, 0, 0, 0])]; tensor cache_11_end_0 = const()[name = tensor("cache_11_end_0"), val = tensor([3, 1, 512, 8])]; tensor cache_11_end_mask_0 = const()[name = tensor("cache_11_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_11_squeeze_mask_0 = const()[name = tensor("cache_11_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_11_cast_fp16 = slice_by_index(begin = cache_11_begin_0, end = cache_11_end_0, end_mask = cache_11_end_mask_0, squeeze_mask = cache_11_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_11_cast_fp16")]; tensor input_131_axes_0 = const()[name = tensor("input_131_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_2_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29206976)))]; tensor encoder_layers_2_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_2_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29208064)))]; tensor input_131_cast_fp16 = layer_norm(axes = input_131_axes_0, beta = encoder_layers_2_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_2_norm_feed_forward1_weight_to_fp16, x = input_129_cast_fp16)[name = tensor("input_131_cast_fp16")]; tensor encoder_layers_2_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_2_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29209152)))]; tensor linear_19_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_2_feed_forward1_linear1_weight_to_fp16, x = input_131_cast_fp16)[name = tensor("linear_19_cast_fp16")]; tensor input_135_cast_fp16 = silu(x = linear_19_cast_fp16)[name = tensor("input_135_cast_fp16")]; tensor encoder_layers_2_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_2_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31306368)))]; tensor linear_20_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_2_feed_forward1_linear2_weight_to_fp16, x = input_135_cast_fp16)[name = tensor("linear_20_cast_fp16")]; tensor var_717_to_fp16 = const()[name = tensor("op_717_to_fp16"), val = tensor(0x1p-1)]; tensor var_718_cast_fp16 = mul(x = linear_20_cast_fp16, y = var_717_to_fp16)[name = tensor("op_718_cast_fp16")]; tensor input_141_cast_fp16 = add(x = input_129_cast_fp16, y = var_718_cast_fp16)[name = tensor("input_141_cast_fp16")]; tensor key_5_axes_0 = const()[name = tensor("key_5_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_2_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33403584)))]; tensor encoder_layers_2_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_2_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33404672)))]; tensor key_5_cast_fp16 = layer_norm(axes = key_5_axes_0, beta = encoder_layers_2_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_2_norm_self_att_weight_to_fp16, x = input_141_cast_fp16)[name = tensor("key_5_cast_fp16")]; tensor input_143_interleave_0 = const()[name = tensor("input_143_interleave_0"), val = tensor(false)]; tensor input_143_cast_fp16 = concat(axis = var_64, interleave = input_143_interleave_0, values = (cache_9_cast_fp16, key_5_cast_fp16))[name = tensor("input_143_cast_fp16")]; tensor var_740_begin_0 = const()[name = tensor("op_740_begin_0"), val = tensor([0, 1, 0])]; tensor var_740_end_0 = const()[name = tensor("op_740_end_0"), val = tensor([1, 70, 512])]; tensor var_740_end_mask_0 = const()[name = tensor("op_740_end_mask_0"), val = tensor([true, true, true])]; tensor var_740_cast_fp16 = slice_by_index(begin = var_740_begin_0, end = var_740_end_0, end_mask = var_740_end_mask_0, x = cache_9_cast_fp16)[name = tensor("op_740_cast_fp16")]; tensor var_743_begin_0 = const()[name = tensor("op_743_begin_0"), val = tensor([0, 0, 0])]; tensor var_743_end_0 = const()[name = tensor("op_743_end_0"), val = tensor([1, 1, 512])]; tensor var_743_end_mask_0 = const()[name = tensor("op_743_end_mask_0"), val = tensor([true, false, true])]; tensor var_743_cast_fp16 = slice_by_index(begin = var_743_begin_0, end = var_743_end_0, end_mask = var_743_end_mask_0, x = key_5_cast_fp16)[name = tensor("op_743_cast_fp16")]; tensor var_746_interleave_0 = const()[name = tensor("op_746_interleave_0"), val = tensor(false)]; tensor var_746_cast_fp16 = concat(axis = var_64, interleave = var_746_interleave_0, values = (var_740_cast_fp16, var_743_cast_fp16))[name = tensor("op_746_cast_fp16")]; tensor encoder_layers_2_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33405760)))]; tensor linear_21_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_2_self_attn_linear_q_weight_to_fp16, x = key_5_cast_fp16)[name = tensor("linear_21_cast_fp16")]; tensor var_750 = const()[name = tensor("op_750"), val = tensor([1, -1, 8, 64])]; tensor q_13_cast_fp16 = reshape(shape = var_750, x = linear_21_cast_fp16)[name = tensor("q_13_cast_fp16")]; tensor encoder_layers_2_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33930112)))]; tensor linear_22_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_2_self_attn_linear_k_weight_to_fp16, x = input_143_cast_fp16)[name = tensor("linear_22_cast_fp16")]; tensor var_754 = const()[name = tensor("op_754"), val = tensor([1, -1, 8, 64])]; tensor k_9_cast_fp16 = reshape(shape = var_754, x = linear_22_cast_fp16)[name = tensor("k_9_cast_fp16")]; tensor encoder_layers_2_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34454464)))]; tensor linear_23_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_2_self_attn_linear_v_weight_to_fp16, x = input_143_cast_fp16)[name = tensor("linear_23_cast_fp16")]; tensor var_758 = const()[name = tensor("op_758"), val = tensor([1, -1, 8, 64])]; tensor v_5_cast_fp16 = reshape(shape = var_758, x = linear_23_cast_fp16)[name = tensor("v_5_cast_fp16")]; tensor value_7_perm_0 = const()[name = tensor("value_7_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_2_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34978816)))]; tensor var_770_cast_fp16 = add(x = q_13_cast_fp16, y = encoder_layers_2_self_attn_pos_bias_u_to_fp16)[name = tensor("op_770_cast_fp16")]; tensor encoder_layers_2_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34979904)))]; tensor var_772_cast_fp16 = add(x = q_13_cast_fp16, y = encoder_layers_2_self_attn_pos_bias_v_to_fp16)[name = tensor("op_772_cast_fp16")]; tensor q_with_bias_v_5_perm_0 = const()[name = tensor("q_with_bias_v_5_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_59_transpose_x_0 = const()[name = tensor("x_59_transpose_x_0"), val = tensor(false)]; tensor x_59_transpose_y_0 = const()[name = tensor("x_59_transpose_y_0"), val = tensor(false)]; tensor var_774_to_fp16 = const()[name = tensor("op_774_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34980992)))]; tensor q_with_bias_v_5_cast_fp16 = transpose(perm = q_with_bias_v_5_perm_0, x = var_772_cast_fp16)[name = tensor("transpose_219")]; tensor x_59_cast_fp16 = matmul(transpose_x = x_59_transpose_x_0, transpose_y = x_59_transpose_y_0, x = q_with_bias_v_5_cast_fp16, y = var_774_to_fp16)[name = tensor("x_59_cast_fp16")]; tensor x_61_pad_0 = const()[name = tensor("x_61_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_61_mode_0 = const()[name = tensor("x_61_mode_0"), val = tensor("constant")]; tensor const_49_to_fp16 = const()[name = tensor("const_49_to_fp16"), val = tensor(0x0p+0)]; tensor x_61_cast_fp16 = pad(constant_val = const_49_to_fp16, mode = x_61_mode_0, pad = x_61_pad_0, x = x_59_cast_fp16)[name = tensor("x_61_cast_fp16")]; tensor var_782 = const()[name = tensor("op_782"), val = tensor([1, 8, -1, 3])]; tensor x_63_cast_fp16 = reshape(shape = var_782, x = x_61_cast_fp16)[name = tensor("x_63_cast_fp16")]; tensor var_786_begin_0 = const()[name = tensor("op_786_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_786_end_0 = const()[name = tensor("op_786_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_786_end_mask_0 = const()[name = tensor("op_786_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_786_cast_fp16 = slice_by_index(begin = var_786_begin_0, end = var_786_end_0, end_mask = var_786_end_mask_0, x = x_63_cast_fp16)[name = tensor("op_786_cast_fp16")]; tensor var_787 = const()[name = tensor("op_787"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_9_cast_fp16 = reshape(shape = var_787, x = var_786_cast_fp16)[name = tensor("matrix_bd_9_cast_fp16")]; tensor matrix_ac_5_transpose_x_0 = const()[name = tensor("matrix_ac_5_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_5_transpose_y_0 = const()[name = tensor("matrix_ac_5_transpose_y_0"), val = tensor(false)]; tensor transpose_55_perm_0 = const()[name = tensor("transpose_55_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_56_perm_0 = const()[name = tensor("transpose_56_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_56 = transpose(perm = transpose_56_perm_0, x = k_9_cast_fp16)[name = tensor("transpose_217")]; tensor transpose_55 = transpose(perm = transpose_55_perm_0, x = var_770_cast_fp16)[name = tensor("transpose_218")]; tensor matrix_ac_5_cast_fp16 = matmul(transpose_x = matrix_ac_5_transpose_x_0, transpose_y = matrix_ac_5_transpose_y_0, x = transpose_55, y = transpose_56)[name = tensor("matrix_ac_5_cast_fp16")]; tensor matrix_bd_11_begin_0 = const()[name = tensor("matrix_bd_11_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_11_end_0 = const()[name = tensor("matrix_bd_11_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_11_end_mask_0 = const()[name = tensor("matrix_bd_11_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_11_cast_fp16 = slice_by_index(begin = matrix_bd_11_begin_0, end = matrix_bd_11_end_0, end_mask = matrix_bd_11_end_mask_0, x = matrix_bd_9_cast_fp16)[name = tensor("matrix_bd_11_cast_fp16")]; tensor var_796_cast_fp16 = add(x = matrix_ac_5_cast_fp16, y = matrix_bd_11_cast_fp16)[name = tensor("op_796_cast_fp16")]; tensor _inversed_scores_9_y_0_to_fp16 = const()[name = tensor("_inversed_scores_9_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_9_cast_fp16 = mul(x = var_796_cast_fp16, y = _inversed_scores_9_y_0_to_fp16)[name = tensor("_inversed_scores_9_cast_fp16")]; tensor scores_11_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_9_cast_fp16, cond = mask_3)[name = tensor("scores_11_cast_fp16")]; tensor var_802_cast_fp16 = softmax(axis = var_62, x = scores_11_cast_fp16)[name = tensor("op_802_cast_fp16")]; tensor input_145_cast_fp16 = select(a = var_40_to_fp16, b = var_802_cast_fp16, cond = mask_3)[name = tensor("input_145_cast_fp16")]; tensor x_65_transpose_x_0 = const()[name = tensor("x_65_transpose_x_0"), val = tensor(false)]; tensor x_65_transpose_y_0 = const()[name = tensor("x_65_transpose_y_0"), val = tensor(false)]; tensor value_7_cast_fp16 = transpose(perm = value_7_perm_0, x = v_5_cast_fp16)[name = tensor("transpose_220")]; tensor x_65_cast_fp16 = matmul(transpose_x = x_65_transpose_x_0, transpose_y = x_65_transpose_y_0, x = input_145_cast_fp16, y = value_7_cast_fp16)[name = tensor("x_65_cast_fp16")]; tensor var_806_perm_0 = const()[name = tensor("op_806_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_807 = const()[name = tensor("op_807"), val = tensor([1, -1, 512])]; tensor var_806_cast_fp16 = transpose(perm = var_806_perm_0, x = x_65_cast_fp16)[name = tensor("transpose_216")]; tensor input_147_cast_fp16 = reshape(shape = var_807, x = var_806_cast_fp16)[name = tensor("input_147_cast_fp16")]; tensor encoder_layers_2_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_2_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35129536)))]; tensor linear_25_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_2_self_attn_linear_out_weight_to_fp16, x = input_147_cast_fp16)[name = tensor("linear_25_cast_fp16")]; tensor input_151_cast_fp16 = add(x = input_141_cast_fp16, y = linear_25_cast_fp16)[name = tensor("input_151_cast_fp16")]; tensor x_69_axes_0 = const()[name = tensor("x_69_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_2_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35653888)))]; tensor encoder_layers_2_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_2_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35654976)))]; tensor x_69_cast_fp16 = layer_norm(axes = x_69_axes_0, beta = encoder_layers_2_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_2_norm_conv_weight_to_fp16, x = input_151_cast_fp16)[name = tensor("x_69_cast_fp16")]; tensor input_153_perm_0 = const()[name = tensor("input_153_perm_0"), val = tensor([0, 2, 1])]; tensor input_155_pad_type_0 = const()[name = tensor("input_155_pad_type_0"), val = tensor("valid")]; tensor input_155_strides_0 = const()[name = tensor("input_155_strides_0"), val = tensor([1])]; tensor input_155_pad_0 = const()[name = tensor("input_155_pad_0"), val = tensor([0, 0])]; tensor input_155_dilations_0 = const()[name = tensor("input_155_dilations_0"), val = tensor([1])]; tensor input_155_groups_0 = const()[name = tensor("input_155_groups_0"), val = tensor(1)]; tensor encoder_layers_2_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_2_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35656064)))]; tensor input_153_cast_fp16 = transpose(perm = input_153_perm_0, x = x_69_cast_fp16)[name = tensor("transpose_215")]; tensor input_155_cast_fp16 = conv(dilations = input_155_dilations_0, groups = input_155_groups_0, pad = input_155_pad_0, pad_type = input_155_pad_type_0, strides = input_155_strides_0, weight = encoder_layers_2_conv_pointwise_conv1_weight_to_fp16, x = input_153_cast_fp16)[name = tensor("input_155_cast_fp16")]; tensor x_71_split_num_splits_0 = const()[name = tensor("x_71_split_num_splits_0"), val = tensor(2)]; tensor x_71_split_axis_0 = const()[name = tensor("x_71_split_axis_0"), val = tensor(1)]; tensor x_71_split_cast_fp16_0, tensor x_71_split_cast_fp16_1 = split(axis = x_71_split_axis_0, num_splits = x_71_split_num_splits_0, x = input_155_cast_fp16)[name = tensor("x_71_split_cast_fp16")]; tensor x_71_split_1_sigmoid_cast_fp16 = sigmoid(x = x_71_split_cast_fp16_1)[name = tensor("x_71_split_1_sigmoid_cast_fp16")]; tensor x_71_cast_fp16 = mul(x = x_71_split_cast_fp16_0, y = x_71_split_1_sigmoid_cast_fp16)[name = tensor("x_71_cast_fp16")]; tensor input_157_cast_fp16 = select(a = var_40_to_fp16, b = x_71_cast_fp16, cond = var_418)[name = tensor("input_157_cast_fp16")]; tensor new_x_11_interleave_0 = const()[name = tensor("new_x_11_interleave_0"), val = tensor(false)]; tensor new_x_11_cast_fp16 = concat(axis = var_62, interleave = new_x_11_interleave_0, values = (cache_11_cast_fp16, input_157_cast_fp16))[name = tensor("new_x_11_cast_fp16")]; tensor next_cache_5_begin_0 = const()[name = tensor("next_cache_5_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_5_end_0 = const()[name = tensor("next_cache_5_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_5_end_mask_0 = const()[name = tensor("next_cache_5_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_5_cast_fp16 = slice_by_index(begin = next_cache_5_begin_0, end = next_cache_5_end_0, end_mask = next_cache_5_end_mask_0, x = new_x_11_cast_fp16)[name = tensor("next_cache_5_cast_fp16")]; tensor var_848_begin_0 = const()[name = tensor("op_848_begin_0"), val = tensor([0, 0, 1])]; tensor var_848_end_0 = const()[name = tensor("op_848_end_0"), val = tensor([1, 512, 9])]; tensor var_848_end_mask_0 = const()[name = tensor("op_848_end_mask_0"), val = tensor([true, true, true])]; tensor var_848_cast_fp16 = slice_by_index(begin = var_848_begin_0, end = var_848_end_0, end_mask = var_848_end_mask_0, x = next_cache_5_cast_fp16)[name = tensor("op_848_cast_fp16")]; tensor x_73_pad_type_0 = const()[name = tensor("x_73_pad_type_0"), val = tensor("valid")]; tensor x_73_groups_0 = const()[name = tensor("x_73_groups_0"), val = tensor(512)]; tensor x_73_strides_0 = const()[name = tensor("x_73_strides_0"), val = tensor([1])]; tensor x_73_pad_0 = const()[name = tensor("x_73_pad_0"), val = tensor([0, 0])]; tensor x_73_dilations_0 = const()[name = tensor("x_73_dilations_0"), val = tensor([1])]; tensor encoder_layers_2_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_2_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36704704)))]; tensor x_73_cast_fp16 = conv(dilations = x_73_dilations_0, groups = x_73_groups_0, pad = x_73_pad_0, pad_type = x_73_pad_type_0, strides = x_73_strides_0, weight = encoder_layers_2_conv_depthwise_conv_weight_to_fp16, x = new_x_11_cast_fp16)[name = tensor("x_73_cast_fp16")]; tensor input_159_perm_0 = const()[name = tensor("input_159_perm_0"), val = tensor([0, 2, 1])]; tensor x_75_axes_0 = const()[name = tensor("x_75_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_2_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36713984)))]; tensor encoder_layers_2_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_2_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36715072)))]; tensor input_159_cast_fp16 = transpose(perm = input_159_perm_0, x = x_73_cast_fp16)[name = tensor("transpose_214")]; tensor x_75_cast_fp16 = layer_norm(axes = x_75_axes_0, beta = encoder_layers_2_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_2_conv_batch_norm_weight_to_fp16, x = input_159_cast_fp16)[name = tensor("x_75_cast_fp16")]; tensor input_161_perm_0 = const()[name = tensor("input_161_perm_0"), val = tensor([0, 2, 1])]; tensor input_161_cast_fp16 = transpose(perm = input_161_perm_0, x = x_75_cast_fp16)[name = tensor("transpose_213")]; tensor input_163_cast_fp16 = silu(x = input_161_cast_fp16)[name = tensor("input_163_cast_fp16")]; tensor x_77_pad_type_0 = const()[name = tensor("x_77_pad_type_0"), val = tensor("valid")]; tensor x_77_strides_0 = const()[name = tensor("x_77_strides_0"), val = tensor([1])]; tensor x_77_pad_0 = const()[name = tensor("x_77_pad_0"), val = tensor([0, 0])]; tensor x_77_dilations_0 = const()[name = tensor("x_77_dilations_0"), val = tensor([1])]; tensor x_77_groups_0 = const()[name = tensor("x_77_groups_0"), val = tensor(1)]; tensor encoder_layers_2_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_2_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36716160)))]; tensor x_77_cast_fp16 = conv(dilations = x_77_dilations_0, groups = x_77_groups_0, pad = x_77_pad_0, pad_type = x_77_pad_type_0, strides = x_77_strides_0, weight = encoder_layers_2_conv_pointwise_conv2_weight_to_fp16, x = input_163_cast_fp16)[name = tensor("x_77_cast_fp16")]; tensor input_165_perm_0 = const()[name = tensor("input_165_perm_0"), val = tensor([0, 2, 1])]; tensor input_165_cast_fp16 = transpose(perm = input_165_perm_0, x = x_77_cast_fp16)[name = tensor("transpose_212")]; tensor input_167_cast_fp16 = add(x = input_151_cast_fp16, y = input_165_cast_fp16)[name = tensor("input_167_cast_fp16")]; tensor input_169_axes_0 = const()[name = tensor("input_169_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_2_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37240512)))]; tensor encoder_layers_2_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_2_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37241600)))]; tensor input_169_cast_fp16 = layer_norm(axes = input_169_axes_0, beta = encoder_layers_2_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_2_norm_feed_forward2_weight_to_fp16, x = input_167_cast_fp16)[name = tensor("input_169_cast_fp16")]; tensor encoder_layers_2_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_2_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37242688)))]; tensor linear_26_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_2_feed_forward2_linear1_weight_to_fp16, x = input_169_cast_fp16)[name = tensor("linear_26_cast_fp16")]; tensor input_173_cast_fp16 = silu(x = linear_26_cast_fp16)[name = tensor("input_173_cast_fp16")]; tensor encoder_layers_2_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_2_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39339904)))]; tensor linear_27_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_2_feed_forward2_linear2_weight_to_fp16, x = input_173_cast_fp16)[name = tensor("linear_27_cast_fp16")]; tensor var_889_to_fp16 = const()[name = tensor("op_889_to_fp16"), val = tensor(0x1p-1)]; tensor var_890_cast_fp16 = mul(x = linear_27_cast_fp16, y = var_889_to_fp16)[name = tensor("op_890_cast_fp16")]; tensor input_179_cast_fp16 = add(x = input_167_cast_fp16, y = var_890_cast_fp16)[name = tensor("input_179_cast_fp16")]; tensor input_181_axes_0 = const()[name = tensor("input_181_axes_0"), val = tensor([-1])]; tensor encoder_layers_2_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_2_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41437120)))]; tensor encoder_layers_2_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_2_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41438208)))]; tensor input_181_cast_fp16 = layer_norm(axes = input_181_axes_0, beta = encoder_layers_2_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_2_norm_out_weight_to_fp16, x = input_179_cast_fp16)[name = tensor("input_181_cast_fp16")]; tensor cache_13_begin_0 = const()[name = tensor("cache_13_begin_0"), val = tensor([3, 0, 0, 0])]; tensor cache_13_end_0 = const()[name = tensor("cache_13_end_0"), val = tensor([4, 1, 70, 512])]; tensor cache_13_end_mask_0 = const()[name = tensor("cache_13_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_13_squeeze_mask_0 = const()[name = tensor("cache_13_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_13_cast_fp16 = slice_by_index(begin = cache_13_begin_0, end = cache_13_end_0, end_mask = cache_13_end_mask_0, squeeze_mask = cache_13_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_13_cast_fp16")]; tensor cache_15_begin_0 = const()[name = tensor("cache_15_begin_0"), val = tensor([3, 0, 0, 0])]; tensor cache_15_end_0 = const()[name = tensor("cache_15_end_0"), val = tensor([4, 1, 512, 8])]; tensor cache_15_end_mask_0 = const()[name = tensor("cache_15_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_15_squeeze_mask_0 = const()[name = tensor("cache_15_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_15_cast_fp16 = slice_by_index(begin = cache_15_begin_0, end = cache_15_end_0, end_mask = cache_15_end_mask_0, squeeze_mask = cache_15_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_15_cast_fp16")]; tensor input_183_axes_0 = const()[name = tensor("input_183_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_3_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41439296)))]; tensor encoder_layers_3_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_3_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41440384)))]; tensor input_183_cast_fp16 = layer_norm(axes = input_183_axes_0, beta = encoder_layers_3_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_3_norm_feed_forward1_weight_to_fp16, x = input_181_cast_fp16)[name = tensor("input_183_cast_fp16")]; tensor encoder_layers_3_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_3_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41441472)))]; tensor linear_28_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_3_feed_forward1_linear1_weight_to_fp16, x = input_183_cast_fp16)[name = tensor("linear_28_cast_fp16")]; tensor input_187_cast_fp16 = silu(x = linear_28_cast_fp16)[name = tensor("input_187_cast_fp16")]; tensor encoder_layers_3_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_3_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43538688)))]; tensor linear_29_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_3_feed_forward1_linear2_weight_to_fp16, x = input_187_cast_fp16)[name = tensor("linear_29_cast_fp16")]; tensor var_924_to_fp16 = const()[name = tensor("op_924_to_fp16"), val = tensor(0x1p-1)]; tensor var_925_cast_fp16 = mul(x = linear_29_cast_fp16, y = var_924_to_fp16)[name = tensor("op_925_cast_fp16")]; tensor input_193_cast_fp16 = add(x = input_181_cast_fp16, y = var_925_cast_fp16)[name = tensor("input_193_cast_fp16")]; tensor key_7_axes_0 = const()[name = tensor("key_7_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_3_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45635904)))]; tensor encoder_layers_3_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_3_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45636992)))]; tensor key_7_cast_fp16 = layer_norm(axes = key_7_axes_0, beta = encoder_layers_3_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_3_norm_self_att_weight_to_fp16, x = input_193_cast_fp16)[name = tensor("key_7_cast_fp16")]; tensor input_195_interleave_0 = const()[name = tensor("input_195_interleave_0"), val = tensor(false)]; tensor input_195_cast_fp16 = concat(axis = var_64, interleave = input_195_interleave_0, values = (cache_13_cast_fp16, key_7_cast_fp16))[name = tensor("input_195_cast_fp16")]; tensor var_947_begin_0 = const()[name = tensor("op_947_begin_0"), val = tensor([0, 1, 0])]; tensor var_947_end_0 = const()[name = tensor("op_947_end_0"), val = tensor([1, 70, 512])]; tensor var_947_end_mask_0 = const()[name = tensor("op_947_end_mask_0"), val = tensor([true, true, true])]; tensor var_947_cast_fp16 = slice_by_index(begin = var_947_begin_0, end = var_947_end_0, end_mask = var_947_end_mask_0, x = cache_13_cast_fp16)[name = tensor("op_947_cast_fp16")]; tensor var_950_begin_0 = const()[name = tensor("op_950_begin_0"), val = tensor([0, 0, 0])]; tensor var_950_end_0 = const()[name = tensor("op_950_end_0"), val = tensor([1, 1, 512])]; tensor var_950_end_mask_0 = const()[name = tensor("op_950_end_mask_0"), val = tensor([true, false, true])]; tensor var_950_cast_fp16 = slice_by_index(begin = var_950_begin_0, end = var_950_end_0, end_mask = var_950_end_mask_0, x = key_7_cast_fp16)[name = tensor("op_950_cast_fp16")]; tensor var_953_interleave_0 = const()[name = tensor("op_953_interleave_0"), val = tensor(false)]; tensor var_953_cast_fp16 = concat(axis = var_64, interleave = var_953_interleave_0, values = (var_947_cast_fp16, var_950_cast_fp16))[name = tensor("op_953_cast_fp16")]; tensor encoder_layers_3_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45638080)))]; tensor linear_30_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_3_self_attn_linear_q_weight_to_fp16, x = key_7_cast_fp16)[name = tensor("linear_30_cast_fp16")]; tensor var_957 = const()[name = tensor("op_957"), val = tensor([1, -1, 8, 64])]; tensor q_19_cast_fp16 = reshape(shape = var_957, x = linear_30_cast_fp16)[name = tensor("q_19_cast_fp16")]; tensor encoder_layers_3_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46162432)))]; tensor linear_31_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_3_self_attn_linear_k_weight_to_fp16, x = input_195_cast_fp16)[name = tensor("linear_31_cast_fp16")]; tensor var_961 = const()[name = tensor("op_961"), val = tensor([1, -1, 8, 64])]; tensor k_13_cast_fp16 = reshape(shape = var_961, x = linear_31_cast_fp16)[name = tensor("k_13_cast_fp16")]; tensor encoder_layers_3_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46686784)))]; tensor linear_32_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_3_self_attn_linear_v_weight_to_fp16, x = input_195_cast_fp16)[name = tensor("linear_32_cast_fp16")]; tensor var_965 = const()[name = tensor("op_965"), val = tensor([1, -1, 8, 64])]; tensor v_7_cast_fp16 = reshape(shape = var_965, x = linear_32_cast_fp16)[name = tensor("v_7_cast_fp16")]; tensor value_9_perm_0 = const()[name = tensor("value_9_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_3_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47211136)))]; tensor var_977_cast_fp16 = add(x = q_19_cast_fp16, y = encoder_layers_3_self_attn_pos_bias_u_to_fp16)[name = tensor("op_977_cast_fp16")]; tensor encoder_layers_3_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47212224)))]; tensor var_979_cast_fp16 = add(x = q_19_cast_fp16, y = encoder_layers_3_self_attn_pos_bias_v_to_fp16)[name = tensor("op_979_cast_fp16")]; tensor q_with_bias_v_7_perm_0 = const()[name = tensor("q_with_bias_v_7_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_85_transpose_x_0 = const()[name = tensor("x_85_transpose_x_0"), val = tensor(false)]; tensor x_85_transpose_y_0 = const()[name = tensor("x_85_transpose_y_0"), val = tensor(false)]; tensor var_981_to_fp16 = const()[name = tensor("op_981_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47213312)))]; tensor q_with_bias_v_7_cast_fp16 = transpose(perm = q_with_bias_v_7_perm_0, x = var_979_cast_fp16)[name = tensor("transpose_210")]; tensor x_85_cast_fp16 = matmul(transpose_x = x_85_transpose_x_0, transpose_y = x_85_transpose_y_0, x = q_with_bias_v_7_cast_fp16, y = var_981_to_fp16)[name = tensor("x_85_cast_fp16")]; tensor x_87_pad_0 = const()[name = tensor("x_87_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_87_mode_0 = const()[name = tensor("x_87_mode_0"), val = tensor("constant")]; tensor const_62_to_fp16 = const()[name = tensor("const_62_to_fp16"), val = tensor(0x0p+0)]; tensor x_87_cast_fp16 = pad(constant_val = const_62_to_fp16, mode = x_87_mode_0, pad = x_87_pad_0, x = x_85_cast_fp16)[name = tensor("x_87_cast_fp16")]; tensor var_989 = const()[name = tensor("op_989"), val = tensor([1, 8, -1, 3])]; tensor x_89_cast_fp16 = reshape(shape = var_989, x = x_87_cast_fp16)[name = tensor("x_89_cast_fp16")]; tensor var_993_begin_0 = const()[name = tensor("op_993_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_993_end_0 = const()[name = tensor("op_993_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_993_end_mask_0 = const()[name = tensor("op_993_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_993_cast_fp16 = slice_by_index(begin = var_993_begin_0, end = var_993_end_0, end_mask = var_993_end_mask_0, x = x_89_cast_fp16)[name = tensor("op_993_cast_fp16")]; tensor var_994 = const()[name = tensor("op_994"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_13_cast_fp16 = reshape(shape = var_994, x = var_993_cast_fp16)[name = tensor("matrix_bd_13_cast_fp16")]; tensor matrix_ac_7_transpose_x_0 = const()[name = tensor("matrix_ac_7_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_7_transpose_y_0 = const()[name = tensor("matrix_ac_7_transpose_y_0"), val = tensor(false)]; tensor transpose_57_perm_0 = const()[name = tensor("transpose_57_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_58_perm_0 = const()[name = tensor("transpose_58_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_58 = transpose(perm = transpose_58_perm_0, x = k_13_cast_fp16)[name = tensor("transpose_208")]; tensor transpose_57 = transpose(perm = transpose_57_perm_0, x = var_977_cast_fp16)[name = tensor("transpose_209")]; tensor matrix_ac_7_cast_fp16 = matmul(transpose_x = matrix_ac_7_transpose_x_0, transpose_y = matrix_ac_7_transpose_y_0, x = transpose_57, y = transpose_58)[name = tensor("matrix_ac_7_cast_fp16")]; tensor matrix_bd_15_begin_0 = const()[name = tensor("matrix_bd_15_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_15_end_0 = const()[name = tensor("matrix_bd_15_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_15_end_mask_0 = const()[name = tensor("matrix_bd_15_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_15_cast_fp16 = slice_by_index(begin = matrix_bd_15_begin_0, end = matrix_bd_15_end_0, end_mask = matrix_bd_15_end_mask_0, x = matrix_bd_13_cast_fp16)[name = tensor("matrix_bd_15_cast_fp16")]; tensor var_1003_cast_fp16 = add(x = matrix_ac_7_cast_fp16, y = matrix_bd_15_cast_fp16)[name = tensor("op_1003_cast_fp16")]; tensor _inversed_scores_13_y_0_to_fp16 = const()[name = tensor("_inversed_scores_13_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_13_cast_fp16 = mul(x = var_1003_cast_fp16, y = _inversed_scores_13_y_0_to_fp16)[name = tensor("_inversed_scores_13_cast_fp16")]; tensor scores_15_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_13_cast_fp16, cond = mask_3)[name = tensor("scores_15_cast_fp16")]; tensor var_1009_cast_fp16 = softmax(axis = var_62, x = scores_15_cast_fp16)[name = tensor("op_1009_cast_fp16")]; tensor input_197_cast_fp16 = select(a = var_40_to_fp16, b = var_1009_cast_fp16, cond = mask_3)[name = tensor("input_197_cast_fp16")]; tensor x_91_transpose_x_0 = const()[name = tensor("x_91_transpose_x_0"), val = tensor(false)]; tensor x_91_transpose_y_0 = const()[name = tensor("x_91_transpose_y_0"), val = tensor(false)]; tensor value_9_cast_fp16 = transpose(perm = value_9_perm_0, x = v_7_cast_fp16)[name = tensor("transpose_211")]; tensor x_91_cast_fp16 = matmul(transpose_x = x_91_transpose_x_0, transpose_y = x_91_transpose_y_0, x = input_197_cast_fp16, y = value_9_cast_fp16)[name = tensor("x_91_cast_fp16")]; tensor var_1013_perm_0 = const()[name = tensor("op_1013_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1014 = const()[name = tensor("op_1014"), val = tensor([1, -1, 512])]; tensor var_1013_cast_fp16 = transpose(perm = var_1013_perm_0, x = x_91_cast_fp16)[name = tensor("transpose_207")]; tensor input_199_cast_fp16 = reshape(shape = var_1014, x = var_1013_cast_fp16)[name = tensor("input_199_cast_fp16")]; tensor encoder_layers_3_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_3_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47361856)))]; tensor linear_34_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_3_self_attn_linear_out_weight_to_fp16, x = input_199_cast_fp16)[name = tensor("linear_34_cast_fp16")]; tensor input_203_cast_fp16 = add(x = input_193_cast_fp16, y = linear_34_cast_fp16)[name = tensor("input_203_cast_fp16")]; tensor x_95_axes_0 = const()[name = tensor("x_95_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_3_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47886208)))]; tensor encoder_layers_3_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_3_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47887296)))]; tensor x_95_cast_fp16 = layer_norm(axes = x_95_axes_0, beta = encoder_layers_3_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_3_norm_conv_weight_to_fp16, x = input_203_cast_fp16)[name = tensor("x_95_cast_fp16")]; tensor input_205_perm_0 = const()[name = tensor("input_205_perm_0"), val = tensor([0, 2, 1])]; tensor input_207_pad_type_0 = const()[name = tensor("input_207_pad_type_0"), val = tensor("valid")]; tensor input_207_strides_0 = const()[name = tensor("input_207_strides_0"), val = tensor([1])]; tensor input_207_pad_0 = const()[name = tensor("input_207_pad_0"), val = tensor([0, 0])]; tensor input_207_dilations_0 = const()[name = tensor("input_207_dilations_0"), val = tensor([1])]; tensor input_207_groups_0 = const()[name = tensor("input_207_groups_0"), val = tensor(1)]; tensor encoder_layers_3_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_3_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47888384)))]; tensor input_205_cast_fp16 = transpose(perm = input_205_perm_0, x = x_95_cast_fp16)[name = tensor("transpose_206")]; tensor input_207_cast_fp16 = conv(dilations = input_207_dilations_0, groups = input_207_groups_0, pad = input_207_pad_0, pad_type = input_207_pad_type_0, strides = input_207_strides_0, weight = encoder_layers_3_conv_pointwise_conv1_weight_to_fp16, x = input_205_cast_fp16)[name = tensor("input_207_cast_fp16")]; tensor x_97_split_num_splits_0 = const()[name = tensor("x_97_split_num_splits_0"), val = tensor(2)]; tensor x_97_split_axis_0 = const()[name = tensor("x_97_split_axis_0"), val = tensor(1)]; tensor x_97_split_cast_fp16_0, tensor x_97_split_cast_fp16_1 = split(axis = x_97_split_axis_0, num_splits = x_97_split_num_splits_0, x = input_207_cast_fp16)[name = tensor("x_97_split_cast_fp16")]; tensor x_97_split_1_sigmoid_cast_fp16 = sigmoid(x = x_97_split_cast_fp16_1)[name = tensor("x_97_split_1_sigmoid_cast_fp16")]; tensor x_97_cast_fp16 = mul(x = x_97_split_cast_fp16_0, y = x_97_split_1_sigmoid_cast_fp16)[name = tensor("x_97_cast_fp16")]; tensor input_209_cast_fp16 = select(a = var_40_to_fp16, b = x_97_cast_fp16, cond = var_418)[name = tensor("input_209_cast_fp16")]; tensor new_x_15_interleave_0 = const()[name = tensor("new_x_15_interleave_0"), val = tensor(false)]; tensor new_x_15_cast_fp16 = concat(axis = var_62, interleave = new_x_15_interleave_0, values = (cache_15_cast_fp16, input_209_cast_fp16))[name = tensor("new_x_15_cast_fp16")]; tensor next_cache_7_begin_0 = const()[name = tensor("next_cache_7_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_7_end_0 = const()[name = tensor("next_cache_7_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_7_end_mask_0 = const()[name = tensor("next_cache_7_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_7_cast_fp16 = slice_by_index(begin = next_cache_7_begin_0, end = next_cache_7_end_0, end_mask = next_cache_7_end_mask_0, x = new_x_15_cast_fp16)[name = tensor("next_cache_7_cast_fp16")]; tensor var_1055_begin_0 = const()[name = tensor("op_1055_begin_0"), val = tensor([0, 0, 1])]; tensor var_1055_end_0 = const()[name = tensor("op_1055_end_0"), val = tensor([1, 512, 9])]; tensor var_1055_end_mask_0 = const()[name = tensor("op_1055_end_mask_0"), val = tensor([true, true, true])]; tensor var_1055_cast_fp16 = slice_by_index(begin = var_1055_begin_0, end = var_1055_end_0, end_mask = var_1055_end_mask_0, x = next_cache_7_cast_fp16)[name = tensor("op_1055_cast_fp16")]; tensor x_99_pad_type_0 = const()[name = tensor("x_99_pad_type_0"), val = tensor("valid")]; tensor x_99_groups_0 = const()[name = tensor("x_99_groups_0"), val = tensor(512)]; tensor x_99_strides_0 = const()[name = tensor("x_99_strides_0"), val = tensor([1])]; tensor x_99_pad_0 = const()[name = tensor("x_99_pad_0"), val = tensor([0, 0])]; tensor x_99_dilations_0 = const()[name = tensor("x_99_dilations_0"), val = tensor([1])]; tensor encoder_layers_3_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_3_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(48937024)))]; tensor x_99_cast_fp16 = conv(dilations = x_99_dilations_0, groups = x_99_groups_0, pad = x_99_pad_0, pad_type = x_99_pad_type_0, strides = x_99_strides_0, weight = encoder_layers_3_conv_depthwise_conv_weight_to_fp16, x = new_x_15_cast_fp16)[name = tensor("x_99_cast_fp16")]; tensor input_211_perm_0 = const()[name = tensor("input_211_perm_0"), val = tensor([0, 2, 1])]; tensor x_101_axes_0 = const()[name = tensor("x_101_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_3_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(48946304)))]; tensor encoder_layers_3_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_3_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(48947392)))]; tensor input_211_cast_fp16 = transpose(perm = input_211_perm_0, x = x_99_cast_fp16)[name = tensor("transpose_205")]; tensor x_101_cast_fp16 = layer_norm(axes = x_101_axes_0, beta = encoder_layers_3_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_3_conv_batch_norm_weight_to_fp16, x = input_211_cast_fp16)[name = tensor("x_101_cast_fp16")]; tensor input_213_perm_0 = const()[name = tensor("input_213_perm_0"), val = tensor([0, 2, 1])]; tensor input_213_cast_fp16 = transpose(perm = input_213_perm_0, x = x_101_cast_fp16)[name = tensor("transpose_204")]; tensor input_215_cast_fp16 = silu(x = input_213_cast_fp16)[name = tensor("input_215_cast_fp16")]; tensor x_103_pad_type_0 = const()[name = tensor("x_103_pad_type_0"), val = tensor("valid")]; tensor x_103_strides_0 = const()[name = tensor("x_103_strides_0"), val = tensor([1])]; tensor x_103_pad_0 = const()[name = tensor("x_103_pad_0"), val = tensor([0, 0])]; tensor x_103_dilations_0 = const()[name = tensor("x_103_dilations_0"), val = tensor([1])]; tensor x_103_groups_0 = const()[name = tensor("x_103_groups_0"), val = tensor(1)]; tensor encoder_layers_3_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_3_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(48948480)))]; tensor x_103_cast_fp16 = conv(dilations = x_103_dilations_0, groups = x_103_groups_0, pad = x_103_pad_0, pad_type = x_103_pad_type_0, strides = x_103_strides_0, weight = encoder_layers_3_conv_pointwise_conv2_weight_to_fp16, x = input_215_cast_fp16)[name = tensor("x_103_cast_fp16")]; tensor input_217_perm_0 = const()[name = tensor("input_217_perm_0"), val = tensor([0, 2, 1])]; tensor input_217_cast_fp16 = transpose(perm = input_217_perm_0, x = x_103_cast_fp16)[name = tensor("transpose_203")]; tensor input_219_cast_fp16 = add(x = input_203_cast_fp16, y = input_217_cast_fp16)[name = tensor("input_219_cast_fp16")]; tensor input_221_axes_0 = const()[name = tensor("input_221_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_3_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49472832)))]; tensor encoder_layers_3_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_3_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49473920)))]; tensor input_221_cast_fp16 = layer_norm(axes = input_221_axes_0, beta = encoder_layers_3_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_3_norm_feed_forward2_weight_to_fp16, x = input_219_cast_fp16)[name = tensor("input_221_cast_fp16")]; tensor encoder_layers_3_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_3_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49475008)))]; tensor linear_35_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_3_feed_forward2_linear1_weight_to_fp16, x = input_221_cast_fp16)[name = tensor("linear_35_cast_fp16")]; tensor input_225_cast_fp16 = silu(x = linear_35_cast_fp16)[name = tensor("input_225_cast_fp16")]; tensor encoder_layers_3_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_3_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(51572224)))]; tensor linear_36_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_3_feed_forward2_linear2_weight_to_fp16, x = input_225_cast_fp16)[name = tensor("linear_36_cast_fp16")]; tensor var_1096_to_fp16 = const()[name = tensor("op_1096_to_fp16"), val = tensor(0x1p-1)]; tensor var_1097_cast_fp16 = mul(x = linear_36_cast_fp16, y = var_1096_to_fp16)[name = tensor("op_1097_cast_fp16")]; tensor input_231_cast_fp16 = add(x = input_219_cast_fp16, y = var_1097_cast_fp16)[name = tensor("input_231_cast_fp16")]; tensor input_233_axes_0 = const()[name = tensor("input_233_axes_0"), val = tensor([-1])]; tensor encoder_layers_3_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_3_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53669440)))]; tensor encoder_layers_3_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_3_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53670528)))]; tensor input_233_cast_fp16 = layer_norm(axes = input_233_axes_0, beta = encoder_layers_3_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_3_norm_out_weight_to_fp16, x = input_231_cast_fp16)[name = tensor("input_233_cast_fp16")]; tensor cache_17_begin_0 = const()[name = tensor("cache_17_begin_0"), val = tensor([4, 0, 0, 0])]; tensor cache_17_end_0 = const()[name = tensor("cache_17_end_0"), val = tensor([5, 1, 70, 512])]; tensor cache_17_end_mask_0 = const()[name = tensor("cache_17_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_17_squeeze_mask_0 = const()[name = tensor("cache_17_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_17_cast_fp16 = slice_by_index(begin = cache_17_begin_0, end = cache_17_end_0, end_mask = cache_17_end_mask_0, squeeze_mask = cache_17_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_17_cast_fp16")]; tensor cache_19_begin_0 = const()[name = tensor("cache_19_begin_0"), val = tensor([4, 0, 0, 0])]; tensor cache_19_end_0 = const()[name = tensor("cache_19_end_0"), val = tensor([5, 1, 512, 8])]; tensor cache_19_end_mask_0 = const()[name = tensor("cache_19_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_19_squeeze_mask_0 = const()[name = tensor("cache_19_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_19_cast_fp16 = slice_by_index(begin = cache_19_begin_0, end = cache_19_end_0, end_mask = cache_19_end_mask_0, squeeze_mask = cache_19_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_19_cast_fp16")]; tensor input_235_axes_0 = const()[name = tensor("input_235_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_4_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53671616)))]; tensor encoder_layers_4_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_4_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53672704)))]; tensor input_235_cast_fp16 = layer_norm(axes = input_235_axes_0, beta = encoder_layers_4_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_4_norm_feed_forward1_weight_to_fp16, x = input_233_cast_fp16)[name = tensor("input_235_cast_fp16")]; tensor encoder_layers_4_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_4_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53673792)))]; tensor linear_37_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_4_feed_forward1_linear1_weight_to_fp16, x = input_235_cast_fp16)[name = tensor("linear_37_cast_fp16")]; tensor input_239_cast_fp16 = silu(x = linear_37_cast_fp16)[name = tensor("input_239_cast_fp16")]; tensor encoder_layers_4_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_4_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(55771008)))]; tensor linear_38_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_4_feed_forward1_linear2_weight_to_fp16, x = input_239_cast_fp16)[name = tensor("linear_38_cast_fp16")]; tensor var_1131_to_fp16 = const()[name = tensor("op_1131_to_fp16"), val = tensor(0x1p-1)]; tensor var_1132_cast_fp16 = mul(x = linear_38_cast_fp16, y = var_1131_to_fp16)[name = tensor("op_1132_cast_fp16")]; tensor input_245_cast_fp16 = add(x = input_233_cast_fp16, y = var_1132_cast_fp16)[name = tensor("input_245_cast_fp16")]; tensor key_9_axes_0 = const()[name = tensor("key_9_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_4_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57868224)))]; tensor encoder_layers_4_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_4_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57869312)))]; tensor key_9_cast_fp16 = layer_norm(axes = key_9_axes_0, beta = encoder_layers_4_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_4_norm_self_att_weight_to_fp16, x = input_245_cast_fp16)[name = tensor("key_9_cast_fp16")]; tensor input_247_interleave_0 = const()[name = tensor("input_247_interleave_0"), val = tensor(false)]; tensor input_247_cast_fp16 = concat(axis = var_64, interleave = input_247_interleave_0, values = (cache_17_cast_fp16, key_9_cast_fp16))[name = tensor("input_247_cast_fp16")]; tensor var_1154_begin_0 = const()[name = tensor("op_1154_begin_0"), val = tensor([0, 1, 0])]; tensor var_1154_end_0 = const()[name = tensor("op_1154_end_0"), val = tensor([1, 70, 512])]; tensor var_1154_end_mask_0 = const()[name = tensor("op_1154_end_mask_0"), val = tensor([true, true, true])]; tensor var_1154_cast_fp16 = slice_by_index(begin = var_1154_begin_0, end = var_1154_end_0, end_mask = var_1154_end_mask_0, x = cache_17_cast_fp16)[name = tensor("op_1154_cast_fp16")]; tensor var_1157_begin_0 = const()[name = tensor("op_1157_begin_0"), val = tensor([0, 0, 0])]; tensor var_1157_end_0 = const()[name = tensor("op_1157_end_0"), val = tensor([1, 1, 512])]; tensor var_1157_end_mask_0 = const()[name = tensor("op_1157_end_mask_0"), val = tensor([true, false, true])]; tensor var_1157_cast_fp16 = slice_by_index(begin = var_1157_begin_0, end = var_1157_end_0, end_mask = var_1157_end_mask_0, x = key_9_cast_fp16)[name = tensor("op_1157_cast_fp16")]; tensor var_1160_interleave_0 = const()[name = tensor("op_1160_interleave_0"), val = tensor(false)]; tensor var_1160_cast_fp16 = concat(axis = var_64, interleave = var_1160_interleave_0, values = (var_1154_cast_fp16, var_1157_cast_fp16))[name = tensor("op_1160_cast_fp16")]; tensor encoder_layers_4_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57870400)))]; tensor linear_39_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_4_self_attn_linear_q_weight_to_fp16, x = key_9_cast_fp16)[name = tensor("linear_39_cast_fp16")]; tensor var_1164 = const()[name = tensor("op_1164"), val = tensor([1, -1, 8, 64])]; tensor q_25_cast_fp16 = reshape(shape = var_1164, x = linear_39_cast_fp16)[name = tensor("q_25_cast_fp16")]; tensor encoder_layers_4_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(58394752)))]; tensor linear_40_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_4_self_attn_linear_k_weight_to_fp16, x = input_247_cast_fp16)[name = tensor("linear_40_cast_fp16")]; tensor var_1168 = const()[name = tensor("op_1168"), val = tensor([1, -1, 8, 64])]; tensor k_17_cast_fp16 = reshape(shape = var_1168, x = linear_40_cast_fp16)[name = tensor("k_17_cast_fp16")]; tensor encoder_layers_4_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(58919104)))]; tensor linear_41_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_4_self_attn_linear_v_weight_to_fp16, x = input_247_cast_fp16)[name = tensor("linear_41_cast_fp16")]; tensor var_1172 = const()[name = tensor("op_1172"), val = tensor([1, -1, 8, 64])]; tensor v_9_cast_fp16 = reshape(shape = var_1172, x = linear_41_cast_fp16)[name = tensor("v_9_cast_fp16")]; tensor value_11_perm_0 = const()[name = tensor("value_11_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_4_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(59443456)))]; tensor var_1184_cast_fp16 = add(x = q_25_cast_fp16, y = encoder_layers_4_self_attn_pos_bias_u_to_fp16)[name = tensor("op_1184_cast_fp16")]; tensor encoder_layers_4_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(59444544)))]; tensor var_1186_cast_fp16 = add(x = q_25_cast_fp16, y = encoder_layers_4_self_attn_pos_bias_v_to_fp16)[name = tensor("op_1186_cast_fp16")]; tensor q_with_bias_v_9_perm_0 = const()[name = tensor("q_with_bias_v_9_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_111_transpose_x_0 = const()[name = tensor("x_111_transpose_x_0"), val = tensor(false)]; tensor x_111_transpose_y_0 = const()[name = tensor("x_111_transpose_y_0"), val = tensor(false)]; tensor var_1188_to_fp16 = const()[name = tensor("op_1188_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(59445632)))]; tensor q_with_bias_v_9_cast_fp16 = transpose(perm = q_with_bias_v_9_perm_0, x = var_1186_cast_fp16)[name = tensor("transpose_201")]; tensor x_111_cast_fp16 = matmul(transpose_x = x_111_transpose_x_0, transpose_y = x_111_transpose_y_0, x = q_with_bias_v_9_cast_fp16, y = var_1188_to_fp16)[name = tensor("x_111_cast_fp16")]; tensor x_113_pad_0 = const()[name = tensor("x_113_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_113_mode_0 = const()[name = tensor("x_113_mode_0"), val = tensor("constant")]; tensor const_75_to_fp16 = const()[name = tensor("const_75_to_fp16"), val = tensor(0x0p+0)]; tensor x_113_cast_fp16 = pad(constant_val = const_75_to_fp16, mode = x_113_mode_0, pad = x_113_pad_0, x = x_111_cast_fp16)[name = tensor("x_113_cast_fp16")]; tensor var_1196 = const()[name = tensor("op_1196"), val = tensor([1, 8, -1, 3])]; tensor x_115_cast_fp16 = reshape(shape = var_1196, x = x_113_cast_fp16)[name = tensor("x_115_cast_fp16")]; tensor var_1200_begin_0 = const()[name = tensor("op_1200_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_1200_end_0 = const()[name = tensor("op_1200_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_1200_end_mask_0 = const()[name = tensor("op_1200_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_1200_cast_fp16 = slice_by_index(begin = var_1200_begin_0, end = var_1200_end_0, end_mask = var_1200_end_mask_0, x = x_115_cast_fp16)[name = tensor("op_1200_cast_fp16")]; tensor var_1201 = const()[name = tensor("op_1201"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_17_cast_fp16 = reshape(shape = var_1201, x = var_1200_cast_fp16)[name = tensor("matrix_bd_17_cast_fp16")]; tensor matrix_ac_9_transpose_x_0 = const()[name = tensor("matrix_ac_9_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_9_transpose_y_0 = const()[name = tensor("matrix_ac_9_transpose_y_0"), val = tensor(false)]; tensor transpose_59_perm_0 = const()[name = tensor("transpose_59_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_60_perm_0 = const()[name = tensor("transpose_60_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_60 = transpose(perm = transpose_60_perm_0, x = k_17_cast_fp16)[name = tensor("transpose_199")]; tensor transpose_59 = transpose(perm = transpose_59_perm_0, x = var_1184_cast_fp16)[name = tensor("transpose_200")]; tensor matrix_ac_9_cast_fp16 = matmul(transpose_x = matrix_ac_9_transpose_x_0, transpose_y = matrix_ac_9_transpose_y_0, x = transpose_59, y = transpose_60)[name = tensor("matrix_ac_9_cast_fp16")]; tensor matrix_bd_19_begin_0 = const()[name = tensor("matrix_bd_19_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_19_end_0 = const()[name = tensor("matrix_bd_19_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_19_end_mask_0 = const()[name = tensor("matrix_bd_19_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_19_cast_fp16 = slice_by_index(begin = matrix_bd_19_begin_0, end = matrix_bd_19_end_0, end_mask = matrix_bd_19_end_mask_0, x = matrix_bd_17_cast_fp16)[name = tensor("matrix_bd_19_cast_fp16")]; tensor var_1210_cast_fp16 = add(x = matrix_ac_9_cast_fp16, y = matrix_bd_19_cast_fp16)[name = tensor("op_1210_cast_fp16")]; tensor _inversed_scores_17_y_0_to_fp16 = const()[name = tensor("_inversed_scores_17_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_17_cast_fp16 = mul(x = var_1210_cast_fp16, y = _inversed_scores_17_y_0_to_fp16)[name = tensor("_inversed_scores_17_cast_fp16")]; tensor scores_19_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_17_cast_fp16, cond = mask_3)[name = tensor("scores_19_cast_fp16")]; tensor var_1216_cast_fp16 = softmax(axis = var_62, x = scores_19_cast_fp16)[name = tensor("op_1216_cast_fp16")]; tensor input_249_cast_fp16 = select(a = var_40_to_fp16, b = var_1216_cast_fp16, cond = mask_3)[name = tensor("input_249_cast_fp16")]; tensor x_117_transpose_x_0 = const()[name = tensor("x_117_transpose_x_0"), val = tensor(false)]; tensor x_117_transpose_y_0 = const()[name = tensor("x_117_transpose_y_0"), val = tensor(false)]; tensor value_11_cast_fp16 = transpose(perm = value_11_perm_0, x = v_9_cast_fp16)[name = tensor("transpose_202")]; tensor x_117_cast_fp16 = matmul(transpose_x = x_117_transpose_x_0, transpose_y = x_117_transpose_y_0, x = input_249_cast_fp16, y = value_11_cast_fp16)[name = tensor("x_117_cast_fp16")]; tensor var_1220_perm_0 = const()[name = tensor("op_1220_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1221 = const()[name = tensor("op_1221"), val = tensor([1, -1, 512])]; tensor var_1220_cast_fp16 = transpose(perm = var_1220_perm_0, x = x_117_cast_fp16)[name = tensor("transpose_198")]; tensor input_251_cast_fp16 = reshape(shape = var_1221, x = var_1220_cast_fp16)[name = tensor("input_251_cast_fp16")]; tensor encoder_layers_4_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_4_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(59594176)))]; tensor linear_43_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_4_self_attn_linear_out_weight_to_fp16, x = input_251_cast_fp16)[name = tensor("linear_43_cast_fp16")]; tensor input_255_cast_fp16 = add(x = input_245_cast_fp16, y = linear_43_cast_fp16)[name = tensor("input_255_cast_fp16")]; tensor x_121_axes_0 = const()[name = tensor("x_121_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_4_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60118528)))]; tensor encoder_layers_4_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_4_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60119616)))]; tensor x_121_cast_fp16 = layer_norm(axes = x_121_axes_0, beta = encoder_layers_4_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_4_norm_conv_weight_to_fp16, x = input_255_cast_fp16)[name = tensor("x_121_cast_fp16")]; tensor input_257_perm_0 = const()[name = tensor("input_257_perm_0"), val = tensor([0, 2, 1])]; tensor input_259_pad_type_0 = const()[name = tensor("input_259_pad_type_0"), val = tensor("valid")]; tensor input_259_strides_0 = const()[name = tensor("input_259_strides_0"), val = tensor([1])]; tensor input_259_pad_0 = const()[name = tensor("input_259_pad_0"), val = tensor([0, 0])]; tensor input_259_dilations_0 = const()[name = tensor("input_259_dilations_0"), val = tensor([1])]; tensor input_259_groups_0 = const()[name = tensor("input_259_groups_0"), val = tensor(1)]; tensor encoder_layers_4_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_4_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60120704)))]; tensor input_257_cast_fp16 = transpose(perm = input_257_perm_0, x = x_121_cast_fp16)[name = tensor("transpose_197")]; tensor input_259_cast_fp16 = conv(dilations = input_259_dilations_0, groups = input_259_groups_0, pad = input_259_pad_0, pad_type = input_259_pad_type_0, strides = input_259_strides_0, weight = encoder_layers_4_conv_pointwise_conv1_weight_to_fp16, x = input_257_cast_fp16)[name = tensor("input_259_cast_fp16")]; tensor x_123_split_num_splits_0 = const()[name = tensor("x_123_split_num_splits_0"), val = tensor(2)]; tensor x_123_split_axis_0 = const()[name = tensor("x_123_split_axis_0"), val = tensor(1)]; tensor x_123_split_cast_fp16_0, tensor x_123_split_cast_fp16_1 = split(axis = x_123_split_axis_0, num_splits = x_123_split_num_splits_0, x = input_259_cast_fp16)[name = tensor("x_123_split_cast_fp16")]; tensor x_123_split_1_sigmoid_cast_fp16 = sigmoid(x = x_123_split_cast_fp16_1)[name = tensor("x_123_split_1_sigmoid_cast_fp16")]; tensor x_123_cast_fp16 = mul(x = x_123_split_cast_fp16_0, y = x_123_split_1_sigmoid_cast_fp16)[name = tensor("x_123_cast_fp16")]; tensor input_261_cast_fp16 = select(a = var_40_to_fp16, b = x_123_cast_fp16, cond = var_418)[name = tensor("input_261_cast_fp16")]; tensor new_x_19_interleave_0 = const()[name = tensor("new_x_19_interleave_0"), val = tensor(false)]; tensor new_x_19_cast_fp16 = concat(axis = var_62, interleave = new_x_19_interleave_0, values = (cache_19_cast_fp16, input_261_cast_fp16))[name = tensor("new_x_19_cast_fp16")]; tensor next_cache_9_begin_0 = const()[name = tensor("next_cache_9_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_9_end_0 = const()[name = tensor("next_cache_9_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_9_end_mask_0 = const()[name = tensor("next_cache_9_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_9_cast_fp16 = slice_by_index(begin = next_cache_9_begin_0, end = next_cache_9_end_0, end_mask = next_cache_9_end_mask_0, x = new_x_19_cast_fp16)[name = tensor("next_cache_9_cast_fp16")]; tensor var_1262_begin_0 = const()[name = tensor("op_1262_begin_0"), val = tensor([0, 0, 1])]; tensor var_1262_end_0 = const()[name = tensor("op_1262_end_0"), val = tensor([1, 512, 9])]; tensor var_1262_end_mask_0 = const()[name = tensor("op_1262_end_mask_0"), val = tensor([true, true, true])]; tensor var_1262_cast_fp16 = slice_by_index(begin = var_1262_begin_0, end = var_1262_end_0, end_mask = var_1262_end_mask_0, x = next_cache_9_cast_fp16)[name = tensor("op_1262_cast_fp16")]; tensor x_125_pad_type_0 = const()[name = tensor("x_125_pad_type_0"), val = tensor("valid")]; tensor x_125_groups_0 = const()[name = tensor("x_125_groups_0"), val = tensor(512)]; tensor x_125_strides_0 = const()[name = tensor("x_125_strides_0"), val = tensor([1])]; tensor x_125_pad_0 = const()[name = tensor("x_125_pad_0"), val = tensor([0, 0])]; tensor x_125_dilations_0 = const()[name = tensor("x_125_dilations_0"), val = tensor([1])]; tensor encoder_layers_4_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_4_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61169344)))]; tensor x_125_cast_fp16 = conv(dilations = x_125_dilations_0, groups = x_125_groups_0, pad = x_125_pad_0, pad_type = x_125_pad_type_0, strides = x_125_strides_0, weight = encoder_layers_4_conv_depthwise_conv_weight_to_fp16, x = new_x_19_cast_fp16)[name = tensor("x_125_cast_fp16")]; tensor input_263_perm_0 = const()[name = tensor("input_263_perm_0"), val = tensor([0, 2, 1])]; tensor x_127_axes_0 = const()[name = tensor("x_127_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_4_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61178624)))]; tensor encoder_layers_4_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_4_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61179712)))]; tensor input_263_cast_fp16 = transpose(perm = input_263_perm_0, x = x_125_cast_fp16)[name = tensor("transpose_196")]; tensor x_127_cast_fp16 = layer_norm(axes = x_127_axes_0, beta = encoder_layers_4_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_4_conv_batch_norm_weight_to_fp16, x = input_263_cast_fp16)[name = tensor("x_127_cast_fp16")]; tensor input_265_perm_0 = const()[name = tensor("input_265_perm_0"), val = tensor([0, 2, 1])]; tensor input_265_cast_fp16 = transpose(perm = input_265_perm_0, x = x_127_cast_fp16)[name = tensor("transpose_195")]; tensor input_267_cast_fp16 = silu(x = input_265_cast_fp16)[name = tensor("input_267_cast_fp16")]; tensor x_129_pad_type_0 = const()[name = tensor("x_129_pad_type_0"), val = tensor("valid")]; tensor x_129_strides_0 = const()[name = tensor("x_129_strides_0"), val = tensor([1])]; tensor x_129_pad_0 = const()[name = tensor("x_129_pad_0"), val = tensor([0, 0])]; tensor x_129_dilations_0 = const()[name = tensor("x_129_dilations_0"), val = tensor([1])]; tensor x_129_groups_0 = const()[name = tensor("x_129_groups_0"), val = tensor(1)]; tensor encoder_layers_4_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_4_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61180800)))]; tensor x_129_cast_fp16 = conv(dilations = x_129_dilations_0, groups = x_129_groups_0, pad = x_129_pad_0, pad_type = x_129_pad_type_0, strides = x_129_strides_0, weight = encoder_layers_4_conv_pointwise_conv2_weight_to_fp16, x = input_267_cast_fp16)[name = tensor("x_129_cast_fp16")]; tensor input_269_perm_0 = const()[name = tensor("input_269_perm_0"), val = tensor([0, 2, 1])]; tensor input_269_cast_fp16 = transpose(perm = input_269_perm_0, x = x_129_cast_fp16)[name = tensor("transpose_194")]; tensor input_271_cast_fp16 = add(x = input_255_cast_fp16, y = input_269_cast_fp16)[name = tensor("input_271_cast_fp16")]; tensor input_273_axes_0 = const()[name = tensor("input_273_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_4_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61705152)))]; tensor encoder_layers_4_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_4_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61706240)))]; tensor input_273_cast_fp16 = layer_norm(axes = input_273_axes_0, beta = encoder_layers_4_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_4_norm_feed_forward2_weight_to_fp16, x = input_271_cast_fp16)[name = tensor("input_273_cast_fp16")]; tensor encoder_layers_4_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_4_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(61707328)))]; tensor linear_44_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_4_feed_forward2_linear1_weight_to_fp16, x = input_273_cast_fp16)[name = tensor("linear_44_cast_fp16")]; tensor input_277_cast_fp16 = silu(x = linear_44_cast_fp16)[name = tensor("input_277_cast_fp16")]; tensor encoder_layers_4_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_4_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(63804544)))]; tensor linear_45_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_4_feed_forward2_linear2_weight_to_fp16, x = input_277_cast_fp16)[name = tensor("linear_45_cast_fp16")]; tensor var_1303_to_fp16 = const()[name = tensor("op_1303_to_fp16"), val = tensor(0x1p-1)]; tensor var_1304_cast_fp16 = mul(x = linear_45_cast_fp16, y = var_1303_to_fp16)[name = tensor("op_1304_cast_fp16")]; tensor input_283_cast_fp16 = add(x = input_271_cast_fp16, y = var_1304_cast_fp16)[name = tensor("input_283_cast_fp16")]; tensor input_285_axes_0 = const()[name = tensor("input_285_axes_0"), val = tensor([-1])]; tensor encoder_layers_4_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_4_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65901760)))]; tensor encoder_layers_4_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_4_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65902848)))]; tensor input_285_cast_fp16 = layer_norm(axes = input_285_axes_0, beta = encoder_layers_4_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_4_norm_out_weight_to_fp16, x = input_283_cast_fp16)[name = tensor("input_285_cast_fp16")]; tensor cache_21_begin_0 = const()[name = tensor("cache_21_begin_0"), val = tensor([5, 0, 0, 0])]; tensor cache_21_end_0 = const()[name = tensor("cache_21_end_0"), val = tensor([6, 1, 70, 512])]; tensor cache_21_end_mask_0 = const()[name = tensor("cache_21_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_21_squeeze_mask_0 = const()[name = tensor("cache_21_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_21_cast_fp16 = slice_by_index(begin = cache_21_begin_0, end = cache_21_end_0, end_mask = cache_21_end_mask_0, squeeze_mask = cache_21_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_21_cast_fp16")]; tensor cache_23_begin_0 = const()[name = tensor("cache_23_begin_0"), val = tensor([5, 0, 0, 0])]; tensor cache_23_end_0 = const()[name = tensor("cache_23_end_0"), val = tensor([6, 1, 512, 8])]; tensor cache_23_end_mask_0 = const()[name = tensor("cache_23_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_23_squeeze_mask_0 = const()[name = tensor("cache_23_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_23_cast_fp16 = slice_by_index(begin = cache_23_begin_0, end = cache_23_end_0, end_mask = cache_23_end_mask_0, squeeze_mask = cache_23_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_23_cast_fp16")]; tensor input_287_axes_0 = const()[name = tensor("input_287_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_5_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65903936)))]; tensor encoder_layers_5_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_5_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65905024)))]; tensor input_287_cast_fp16 = layer_norm(axes = input_287_axes_0, beta = encoder_layers_5_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_5_norm_feed_forward1_weight_to_fp16, x = input_285_cast_fp16)[name = tensor("input_287_cast_fp16")]; tensor encoder_layers_5_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_5_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65906112)))]; tensor linear_46_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_5_feed_forward1_linear1_weight_to_fp16, x = input_287_cast_fp16)[name = tensor("linear_46_cast_fp16")]; tensor input_291_cast_fp16 = silu(x = linear_46_cast_fp16)[name = tensor("input_291_cast_fp16")]; tensor encoder_layers_5_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_5_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68003328)))]; tensor linear_47_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_5_feed_forward1_linear2_weight_to_fp16, x = input_291_cast_fp16)[name = tensor("linear_47_cast_fp16")]; tensor var_1338_to_fp16 = const()[name = tensor("op_1338_to_fp16"), val = tensor(0x1p-1)]; tensor var_1339_cast_fp16 = mul(x = linear_47_cast_fp16, y = var_1338_to_fp16)[name = tensor("op_1339_cast_fp16")]; tensor input_297_cast_fp16 = add(x = input_285_cast_fp16, y = var_1339_cast_fp16)[name = tensor("input_297_cast_fp16")]; tensor key_11_axes_0 = const()[name = tensor("key_11_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_5_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(70100544)))]; tensor encoder_layers_5_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_5_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(70101632)))]; tensor key_11_cast_fp16 = layer_norm(axes = key_11_axes_0, beta = encoder_layers_5_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_5_norm_self_att_weight_to_fp16, x = input_297_cast_fp16)[name = tensor("key_11_cast_fp16")]; tensor input_299_interleave_0 = const()[name = tensor("input_299_interleave_0"), val = tensor(false)]; tensor input_299_cast_fp16 = concat(axis = var_64, interleave = input_299_interleave_0, values = (cache_21_cast_fp16, key_11_cast_fp16))[name = tensor("input_299_cast_fp16")]; tensor var_1361_begin_0 = const()[name = tensor("op_1361_begin_0"), val = tensor([0, 1, 0])]; tensor var_1361_end_0 = const()[name = tensor("op_1361_end_0"), val = tensor([1, 70, 512])]; tensor var_1361_end_mask_0 = const()[name = tensor("op_1361_end_mask_0"), val = tensor([true, true, true])]; tensor var_1361_cast_fp16 = slice_by_index(begin = var_1361_begin_0, end = var_1361_end_0, end_mask = var_1361_end_mask_0, x = cache_21_cast_fp16)[name = tensor("op_1361_cast_fp16")]; tensor var_1364_begin_0 = const()[name = tensor("op_1364_begin_0"), val = tensor([0, 0, 0])]; tensor var_1364_end_0 = const()[name = tensor("op_1364_end_0"), val = tensor([1, 1, 512])]; tensor var_1364_end_mask_0 = const()[name = tensor("op_1364_end_mask_0"), val = tensor([true, false, true])]; tensor var_1364_cast_fp16 = slice_by_index(begin = var_1364_begin_0, end = var_1364_end_0, end_mask = var_1364_end_mask_0, x = key_11_cast_fp16)[name = tensor("op_1364_cast_fp16")]; tensor var_1367_interleave_0 = const()[name = tensor("op_1367_interleave_0"), val = tensor(false)]; tensor var_1367_cast_fp16 = concat(axis = var_64, interleave = var_1367_interleave_0, values = (var_1361_cast_fp16, var_1364_cast_fp16))[name = tensor("op_1367_cast_fp16")]; tensor encoder_layers_5_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(70102720)))]; tensor linear_48_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_5_self_attn_linear_q_weight_to_fp16, x = key_11_cast_fp16)[name = tensor("linear_48_cast_fp16")]; tensor var_1371 = const()[name = tensor("op_1371"), val = tensor([1, -1, 8, 64])]; tensor q_31_cast_fp16 = reshape(shape = var_1371, x = linear_48_cast_fp16)[name = tensor("q_31_cast_fp16")]; tensor encoder_layers_5_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(70627072)))]; tensor linear_49_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_5_self_attn_linear_k_weight_to_fp16, x = input_299_cast_fp16)[name = tensor("linear_49_cast_fp16")]; tensor var_1375 = const()[name = tensor("op_1375"), val = tensor([1, -1, 8, 64])]; tensor k_21_cast_fp16 = reshape(shape = var_1375, x = linear_49_cast_fp16)[name = tensor("k_21_cast_fp16")]; tensor encoder_layers_5_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(71151424)))]; tensor linear_50_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_5_self_attn_linear_v_weight_to_fp16, x = input_299_cast_fp16)[name = tensor("linear_50_cast_fp16")]; tensor var_1379 = const()[name = tensor("op_1379"), val = tensor([1, -1, 8, 64])]; tensor v_11_cast_fp16 = reshape(shape = var_1379, x = linear_50_cast_fp16)[name = tensor("v_11_cast_fp16")]; tensor value_13_perm_0 = const()[name = tensor("value_13_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_5_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(71675776)))]; tensor var_1391_cast_fp16 = add(x = q_31_cast_fp16, y = encoder_layers_5_self_attn_pos_bias_u_to_fp16)[name = tensor("op_1391_cast_fp16")]; tensor encoder_layers_5_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(71676864)))]; tensor var_1393_cast_fp16 = add(x = q_31_cast_fp16, y = encoder_layers_5_self_attn_pos_bias_v_to_fp16)[name = tensor("op_1393_cast_fp16")]; tensor q_with_bias_v_11_perm_0 = const()[name = tensor("q_with_bias_v_11_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_137_transpose_x_0 = const()[name = tensor("x_137_transpose_x_0"), val = tensor(false)]; tensor x_137_transpose_y_0 = const()[name = tensor("x_137_transpose_y_0"), val = tensor(false)]; tensor var_1395_to_fp16 = const()[name = tensor("op_1395_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(71677952)))]; tensor q_with_bias_v_11_cast_fp16 = transpose(perm = q_with_bias_v_11_perm_0, x = var_1393_cast_fp16)[name = tensor("transpose_192")]; tensor x_137_cast_fp16 = matmul(transpose_x = x_137_transpose_x_0, transpose_y = x_137_transpose_y_0, x = q_with_bias_v_11_cast_fp16, y = var_1395_to_fp16)[name = tensor("x_137_cast_fp16")]; tensor x_139_pad_0 = const()[name = tensor("x_139_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_139_mode_0 = const()[name = tensor("x_139_mode_0"), val = tensor("constant")]; tensor const_88_to_fp16 = const()[name = tensor("const_88_to_fp16"), val = tensor(0x0p+0)]; tensor x_139_cast_fp16 = pad(constant_val = const_88_to_fp16, mode = x_139_mode_0, pad = x_139_pad_0, x = x_137_cast_fp16)[name = tensor("x_139_cast_fp16")]; tensor var_1403 = const()[name = tensor("op_1403"), val = tensor([1, 8, -1, 3])]; tensor x_141_cast_fp16 = reshape(shape = var_1403, x = x_139_cast_fp16)[name = tensor("x_141_cast_fp16")]; tensor var_1407_begin_0 = const()[name = tensor("op_1407_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_1407_end_0 = const()[name = tensor("op_1407_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_1407_end_mask_0 = const()[name = tensor("op_1407_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_1407_cast_fp16 = slice_by_index(begin = var_1407_begin_0, end = var_1407_end_0, end_mask = var_1407_end_mask_0, x = x_141_cast_fp16)[name = tensor("op_1407_cast_fp16")]; tensor var_1408 = const()[name = tensor("op_1408"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_21_cast_fp16 = reshape(shape = var_1408, x = var_1407_cast_fp16)[name = tensor("matrix_bd_21_cast_fp16")]; tensor matrix_ac_11_transpose_x_0 = const()[name = tensor("matrix_ac_11_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_11_transpose_y_0 = const()[name = tensor("matrix_ac_11_transpose_y_0"), val = tensor(false)]; tensor transpose_61_perm_0 = const()[name = tensor("transpose_61_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_62_perm_0 = const()[name = tensor("transpose_62_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_62 = transpose(perm = transpose_62_perm_0, x = k_21_cast_fp16)[name = tensor("transpose_190")]; tensor transpose_61 = transpose(perm = transpose_61_perm_0, x = var_1391_cast_fp16)[name = tensor("transpose_191")]; tensor matrix_ac_11_cast_fp16 = matmul(transpose_x = matrix_ac_11_transpose_x_0, transpose_y = matrix_ac_11_transpose_y_0, x = transpose_61, y = transpose_62)[name = tensor("matrix_ac_11_cast_fp16")]; tensor matrix_bd_23_begin_0 = const()[name = tensor("matrix_bd_23_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_23_end_0 = const()[name = tensor("matrix_bd_23_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_23_end_mask_0 = const()[name = tensor("matrix_bd_23_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_23_cast_fp16 = slice_by_index(begin = matrix_bd_23_begin_0, end = matrix_bd_23_end_0, end_mask = matrix_bd_23_end_mask_0, x = matrix_bd_21_cast_fp16)[name = tensor("matrix_bd_23_cast_fp16")]; tensor var_1417_cast_fp16 = add(x = matrix_ac_11_cast_fp16, y = matrix_bd_23_cast_fp16)[name = tensor("op_1417_cast_fp16")]; tensor _inversed_scores_21_y_0_to_fp16 = const()[name = tensor("_inversed_scores_21_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_21_cast_fp16 = mul(x = var_1417_cast_fp16, y = _inversed_scores_21_y_0_to_fp16)[name = tensor("_inversed_scores_21_cast_fp16")]; tensor scores_23_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_21_cast_fp16, cond = mask_3)[name = tensor("scores_23_cast_fp16")]; tensor var_1423_cast_fp16 = softmax(axis = var_62, x = scores_23_cast_fp16)[name = tensor("op_1423_cast_fp16")]; tensor input_301_cast_fp16 = select(a = var_40_to_fp16, b = var_1423_cast_fp16, cond = mask_3)[name = tensor("input_301_cast_fp16")]; tensor x_143_transpose_x_0 = const()[name = tensor("x_143_transpose_x_0"), val = tensor(false)]; tensor x_143_transpose_y_0 = const()[name = tensor("x_143_transpose_y_0"), val = tensor(false)]; tensor value_13_cast_fp16 = transpose(perm = value_13_perm_0, x = v_11_cast_fp16)[name = tensor("transpose_193")]; tensor x_143_cast_fp16 = matmul(transpose_x = x_143_transpose_x_0, transpose_y = x_143_transpose_y_0, x = input_301_cast_fp16, y = value_13_cast_fp16)[name = tensor("x_143_cast_fp16")]; tensor var_1427_perm_0 = const()[name = tensor("op_1427_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1428 = const()[name = tensor("op_1428"), val = tensor([1, -1, 512])]; tensor var_1427_cast_fp16 = transpose(perm = var_1427_perm_0, x = x_143_cast_fp16)[name = tensor("transpose_189")]; tensor input_303_cast_fp16 = reshape(shape = var_1428, x = var_1427_cast_fp16)[name = tensor("input_303_cast_fp16")]; tensor encoder_layers_5_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_5_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(71826496)))]; tensor linear_52_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_5_self_attn_linear_out_weight_to_fp16, x = input_303_cast_fp16)[name = tensor("linear_52_cast_fp16")]; tensor input_307_cast_fp16 = add(x = input_297_cast_fp16, y = linear_52_cast_fp16)[name = tensor("input_307_cast_fp16")]; tensor x_147_axes_0 = const()[name = tensor("x_147_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_5_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(72350848)))]; tensor encoder_layers_5_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_5_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(72351936)))]; tensor x_147_cast_fp16 = layer_norm(axes = x_147_axes_0, beta = encoder_layers_5_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_5_norm_conv_weight_to_fp16, x = input_307_cast_fp16)[name = tensor("x_147_cast_fp16")]; tensor input_309_perm_0 = const()[name = tensor("input_309_perm_0"), val = tensor([0, 2, 1])]; tensor input_311_pad_type_0 = const()[name = tensor("input_311_pad_type_0"), val = tensor("valid")]; tensor input_311_strides_0 = const()[name = tensor("input_311_strides_0"), val = tensor([1])]; tensor input_311_pad_0 = const()[name = tensor("input_311_pad_0"), val = tensor([0, 0])]; tensor input_311_dilations_0 = const()[name = tensor("input_311_dilations_0"), val = tensor([1])]; tensor input_311_groups_0 = const()[name = tensor("input_311_groups_0"), val = tensor(1)]; tensor encoder_layers_5_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_5_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(72353024)))]; tensor input_309_cast_fp16 = transpose(perm = input_309_perm_0, x = x_147_cast_fp16)[name = tensor("transpose_188")]; tensor input_311_cast_fp16 = conv(dilations = input_311_dilations_0, groups = input_311_groups_0, pad = input_311_pad_0, pad_type = input_311_pad_type_0, strides = input_311_strides_0, weight = encoder_layers_5_conv_pointwise_conv1_weight_to_fp16, x = input_309_cast_fp16)[name = tensor("input_311_cast_fp16")]; tensor x_149_split_num_splits_0 = const()[name = tensor("x_149_split_num_splits_0"), val = tensor(2)]; tensor x_149_split_axis_0 = const()[name = tensor("x_149_split_axis_0"), val = tensor(1)]; tensor x_149_split_cast_fp16_0, tensor x_149_split_cast_fp16_1 = split(axis = x_149_split_axis_0, num_splits = x_149_split_num_splits_0, x = input_311_cast_fp16)[name = tensor("x_149_split_cast_fp16")]; tensor x_149_split_1_sigmoid_cast_fp16 = sigmoid(x = x_149_split_cast_fp16_1)[name = tensor("x_149_split_1_sigmoid_cast_fp16")]; tensor x_149_cast_fp16 = mul(x = x_149_split_cast_fp16_0, y = x_149_split_1_sigmoid_cast_fp16)[name = tensor("x_149_cast_fp16")]; tensor input_313_cast_fp16 = select(a = var_40_to_fp16, b = x_149_cast_fp16, cond = var_418)[name = tensor("input_313_cast_fp16")]; tensor new_x_23_interleave_0 = const()[name = tensor("new_x_23_interleave_0"), val = tensor(false)]; tensor new_x_23_cast_fp16 = concat(axis = var_62, interleave = new_x_23_interleave_0, values = (cache_23_cast_fp16, input_313_cast_fp16))[name = tensor("new_x_23_cast_fp16")]; tensor next_cache_11_begin_0 = const()[name = tensor("next_cache_11_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_11_end_0 = const()[name = tensor("next_cache_11_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_11_end_mask_0 = const()[name = tensor("next_cache_11_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_11_cast_fp16 = slice_by_index(begin = next_cache_11_begin_0, end = next_cache_11_end_0, end_mask = next_cache_11_end_mask_0, x = new_x_23_cast_fp16)[name = tensor("next_cache_11_cast_fp16")]; tensor var_1469_begin_0 = const()[name = tensor("op_1469_begin_0"), val = tensor([0, 0, 1])]; tensor var_1469_end_0 = const()[name = tensor("op_1469_end_0"), val = tensor([1, 512, 9])]; tensor var_1469_end_mask_0 = const()[name = tensor("op_1469_end_mask_0"), val = tensor([true, true, true])]; tensor var_1469_cast_fp16 = slice_by_index(begin = var_1469_begin_0, end = var_1469_end_0, end_mask = var_1469_end_mask_0, x = next_cache_11_cast_fp16)[name = tensor("op_1469_cast_fp16")]; tensor x_151_pad_type_0 = const()[name = tensor("x_151_pad_type_0"), val = tensor("valid")]; tensor x_151_groups_0 = const()[name = tensor("x_151_groups_0"), val = tensor(512)]; tensor x_151_strides_0 = const()[name = tensor("x_151_strides_0"), val = tensor([1])]; tensor x_151_pad_0 = const()[name = tensor("x_151_pad_0"), val = tensor([0, 0])]; tensor x_151_dilations_0 = const()[name = tensor("x_151_dilations_0"), val = tensor([1])]; tensor encoder_layers_5_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_5_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(73401664)))]; tensor x_151_cast_fp16 = conv(dilations = x_151_dilations_0, groups = x_151_groups_0, pad = x_151_pad_0, pad_type = x_151_pad_type_0, strides = x_151_strides_0, weight = encoder_layers_5_conv_depthwise_conv_weight_to_fp16, x = new_x_23_cast_fp16)[name = tensor("x_151_cast_fp16")]; tensor input_315_perm_0 = const()[name = tensor("input_315_perm_0"), val = tensor([0, 2, 1])]; tensor x_153_axes_0 = const()[name = tensor("x_153_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_5_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(73410944)))]; tensor encoder_layers_5_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_5_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(73412032)))]; tensor input_315_cast_fp16 = transpose(perm = input_315_perm_0, x = x_151_cast_fp16)[name = tensor("transpose_187")]; tensor x_153_cast_fp16 = layer_norm(axes = x_153_axes_0, beta = encoder_layers_5_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_5_conv_batch_norm_weight_to_fp16, x = input_315_cast_fp16)[name = tensor("x_153_cast_fp16")]; tensor input_317_perm_0 = const()[name = tensor("input_317_perm_0"), val = tensor([0, 2, 1])]; tensor input_317_cast_fp16 = transpose(perm = input_317_perm_0, x = x_153_cast_fp16)[name = tensor("transpose_186")]; tensor input_319_cast_fp16 = silu(x = input_317_cast_fp16)[name = tensor("input_319_cast_fp16")]; tensor x_155_pad_type_0 = const()[name = tensor("x_155_pad_type_0"), val = tensor("valid")]; tensor x_155_strides_0 = const()[name = tensor("x_155_strides_0"), val = tensor([1])]; tensor x_155_pad_0 = const()[name = tensor("x_155_pad_0"), val = tensor([0, 0])]; tensor x_155_dilations_0 = const()[name = tensor("x_155_dilations_0"), val = tensor([1])]; tensor x_155_groups_0 = const()[name = tensor("x_155_groups_0"), val = tensor(1)]; tensor encoder_layers_5_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_5_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(73413120)))]; tensor x_155_cast_fp16 = conv(dilations = x_155_dilations_0, groups = x_155_groups_0, pad = x_155_pad_0, pad_type = x_155_pad_type_0, strides = x_155_strides_0, weight = encoder_layers_5_conv_pointwise_conv2_weight_to_fp16, x = input_319_cast_fp16)[name = tensor("x_155_cast_fp16")]; tensor input_321_perm_0 = const()[name = tensor("input_321_perm_0"), val = tensor([0, 2, 1])]; tensor input_321_cast_fp16 = transpose(perm = input_321_perm_0, x = x_155_cast_fp16)[name = tensor("transpose_185")]; tensor input_323_cast_fp16 = add(x = input_307_cast_fp16, y = input_321_cast_fp16)[name = tensor("input_323_cast_fp16")]; tensor input_325_axes_0 = const()[name = tensor("input_325_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_5_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(73937472)))]; tensor encoder_layers_5_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_5_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(73938560)))]; tensor input_325_cast_fp16 = layer_norm(axes = input_325_axes_0, beta = encoder_layers_5_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_5_norm_feed_forward2_weight_to_fp16, x = input_323_cast_fp16)[name = tensor("input_325_cast_fp16")]; tensor encoder_layers_5_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_5_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(73939648)))]; tensor linear_53_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_5_feed_forward2_linear1_weight_to_fp16, x = input_325_cast_fp16)[name = tensor("linear_53_cast_fp16")]; tensor input_329_cast_fp16 = silu(x = linear_53_cast_fp16)[name = tensor("input_329_cast_fp16")]; tensor encoder_layers_5_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_5_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(76036864)))]; tensor linear_54_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_5_feed_forward2_linear2_weight_to_fp16, x = input_329_cast_fp16)[name = tensor("linear_54_cast_fp16")]; tensor var_1510_to_fp16 = const()[name = tensor("op_1510_to_fp16"), val = tensor(0x1p-1)]; tensor var_1511_cast_fp16 = mul(x = linear_54_cast_fp16, y = var_1510_to_fp16)[name = tensor("op_1511_cast_fp16")]; tensor input_335_cast_fp16 = add(x = input_323_cast_fp16, y = var_1511_cast_fp16)[name = tensor("input_335_cast_fp16")]; tensor input_337_axes_0 = const()[name = tensor("input_337_axes_0"), val = tensor([-1])]; tensor encoder_layers_5_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_5_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78134080)))]; tensor encoder_layers_5_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_5_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78135168)))]; tensor input_337_cast_fp16 = layer_norm(axes = input_337_axes_0, beta = encoder_layers_5_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_5_norm_out_weight_to_fp16, x = input_335_cast_fp16)[name = tensor("input_337_cast_fp16")]; tensor cache_25_begin_0 = const()[name = tensor("cache_25_begin_0"), val = tensor([6, 0, 0, 0])]; tensor cache_25_end_0 = const()[name = tensor("cache_25_end_0"), val = tensor([7, 1, 70, 512])]; tensor cache_25_end_mask_0 = const()[name = tensor("cache_25_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_25_squeeze_mask_0 = const()[name = tensor("cache_25_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_25_cast_fp16 = slice_by_index(begin = cache_25_begin_0, end = cache_25_end_0, end_mask = cache_25_end_mask_0, squeeze_mask = cache_25_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_25_cast_fp16")]; tensor cache_27_begin_0 = const()[name = tensor("cache_27_begin_0"), val = tensor([6, 0, 0, 0])]; tensor cache_27_end_0 = const()[name = tensor("cache_27_end_0"), val = tensor([7, 1, 512, 8])]; tensor cache_27_end_mask_0 = const()[name = tensor("cache_27_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_27_squeeze_mask_0 = const()[name = tensor("cache_27_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_27_cast_fp16 = slice_by_index(begin = cache_27_begin_0, end = cache_27_end_0, end_mask = cache_27_end_mask_0, squeeze_mask = cache_27_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_27_cast_fp16")]; tensor input_339_axes_0 = const()[name = tensor("input_339_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_6_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78136256)))]; tensor encoder_layers_6_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_6_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78137344)))]; tensor input_339_cast_fp16 = layer_norm(axes = input_339_axes_0, beta = encoder_layers_6_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_6_norm_feed_forward1_weight_to_fp16, x = input_337_cast_fp16)[name = tensor("input_339_cast_fp16")]; tensor encoder_layers_6_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_6_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78138432)))]; tensor linear_55_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_6_feed_forward1_linear1_weight_to_fp16, x = input_339_cast_fp16)[name = tensor("linear_55_cast_fp16")]; tensor input_343_cast_fp16 = silu(x = linear_55_cast_fp16)[name = tensor("input_343_cast_fp16")]; tensor encoder_layers_6_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_6_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80235648)))]; tensor linear_56_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_6_feed_forward1_linear2_weight_to_fp16, x = input_343_cast_fp16)[name = tensor("linear_56_cast_fp16")]; tensor var_1545_to_fp16 = const()[name = tensor("op_1545_to_fp16"), val = tensor(0x1p-1)]; tensor var_1546_cast_fp16 = mul(x = linear_56_cast_fp16, y = var_1545_to_fp16)[name = tensor("op_1546_cast_fp16")]; tensor input_349_cast_fp16 = add(x = input_337_cast_fp16, y = var_1546_cast_fp16)[name = tensor("input_349_cast_fp16")]; tensor key_13_axes_0 = const()[name = tensor("key_13_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_6_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82332864)))]; tensor encoder_layers_6_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_6_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82333952)))]; tensor key_13_cast_fp16 = layer_norm(axes = key_13_axes_0, beta = encoder_layers_6_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_6_norm_self_att_weight_to_fp16, x = input_349_cast_fp16)[name = tensor("key_13_cast_fp16")]; tensor input_351_interleave_0 = const()[name = tensor("input_351_interleave_0"), val = tensor(false)]; tensor input_351_cast_fp16 = concat(axis = var_64, interleave = input_351_interleave_0, values = (cache_25_cast_fp16, key_13_cast_fp16))[name = tensor("input_351_cast_fp16")]; tensor var_1568_begin_0 = const()[name = tensor("op_1568_begin_0"), val = tensor([0, 1, 0])]; tensor var_1568_end_0 = const()[name = tensor("op_1568_end_0"), val = tensor([1, 70, 512])]; tensor var_1568_end_mask_0 = const()[name = tensor("op_1568_end_mask_0"), val = tensor([true, true, true])]; tensor var_1568_cast_fp16 = slice_by_index(begin = var_1568_begin_0, end = var_1568_end_0, end_mask = var_1568_end_mask_0, x = cache_25_cast_fp16)[name = tensor("op_1568_cast_fp16")]; tensor var_1571_begin_0 = const()[name = tensor("op_1571_begin_0"), val = tensor([0, 0, 0])]; tensor var_1571_end_0 = const()[name = tensor("op_1571_end_0"), val = tensor([1, 1, 512])]; tensor var_1571_end_mask_0 = const()[name = tensor("op_1571_end_mask_0"), val = tensor([true, false, true])]; tensor var_1571_cast_fp16 = slice_by_index(begin = var_1571_begin_0, end = var_1571_end_0, end_mask = var_1571_end_mask_0, x = key_13_cast_fp16)[name = tensor("op_1571_cast_fp16")]; tensor var_1574_interleave_0 = const()[name = tensor("op_1574_interleave_0"), val = tensor(false)]; tensor var_1574_cast_fp16 = concat(axis = var_64, interleave = var_1574_interleave_0, values = (var_1568_cast_fp16, var_1571_cast_fp16))[name = tensor("op_1574_cast_fp16")]; tensor encoder_layers_6_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82335040)))]; tensor linear_57_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_6_self_attn_linear_q_weight_to_fp16, x = key_13_cast_fp16)[name = tensor("linear_57_cast_fp16")]; tensor var_1578 = const()[name = tensor("op_1578"), val = tensor([1, -1, 8, 64])]; tensor q_37_cast_fp16 = reshape(shape = var_1578, x = linear_57_cast_fp16)[name = tensor("q_37_cast_fp16")]; tensor encoder_layers_6_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82859392)))]; tensor linear_58_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_6_self_attn_linear_k_weight_to_fp16, x = input_351_cast_fp16)[name = tensor("linear_58_cast_fp16")]; tensor var_1582 = const()[name = tensor("op_1582"), val = tensor([1, -1, 8, 64])]; tensor k_25_cast_fp16 = reshape(shape = var_1582, x = linear_58_cast_fp16)[name = tensor("k_25_cast_fp16")]; tensor encoder_layers_6_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83383744)))]; tensor linear_59_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_6_self_attn_linear_v_weight_to_fp16, x = input_351_cast_fp16)[name = tensor("linear_59_cast_fp16")]; tensor var_1586 = const()[name = tensor("op_1586"), val = tensor([1, -1, 8, 64])]; tensor v_13_cast_fp16 = reshape(shape = var_1586, x = linear_59_cast_fp16)[name = tensor("v_13_cast_fp16")]; tensor value_15_perm_0 = const()[name = tensor("value_15_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_6_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83908096)))]; tensor var_1598_cast_fp16 = add(x = q_37_cast_fp16, y = encoder_layers_6_self_attn_pos_bias_u_to_fp16)[name = tensor("op_1598_cast_fp16")]; tensor encoder_layers_6_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83909184)))]; tensor var_1600_cast_fp16 = add(x = q_37_cast_fp16, y = encoder_layers_6_self_attn_pos_bias_v_to_fp16)[name = tensor("op_1600_cast_fp16")]; tensor q_with_bias_v_13_perm_0 = const()[name = tensor("q_with_bias_v_13_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_163_transpose_x_0 = const()[name = tensor("x_163_transpose_x_0"), val = tensor(false)]; tensor x_163_transpose_y_0 = const()[name = tensor("x_163_transpose_y_0"), val = tensor(false)]; tensor var_1602_to_fp16 = const()[name = tensor("op_1602_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83910272)))]; tensor q_with_bias_v_13_cast_fp16 = transpose(perm = q_with_bias_v_13_perm_0, x = var_1600_cast_fp16)[name = tensor("transpose_183")]; tensor x_163_cast_fp16 = matmul(transpose_x = x_163_transpose_x_0, transpose_y = x_163_transpose_y_0, x = q_with_bias_v_13_cast_fp16, y = var_1602_to_fp16)[name = tensor("x_163_cast_fp16")]; tensor x_165_pad_0 = const()[name = tensor("x_165_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_165_mode_0 = const()[name = tensor("x_165_mode_0"), val = tensor("constant")]; tensor const_101_to_fp16 = const()[name = tensor("const_101_to_fp16"), val = tensor(0x0p+0)]; tensor x_165_cast_fp16 = pad(constant_val = const_101_to_fp16, mode = x_165_mode_0, pad = x_165_pad_0, x = x_163_cast_fp16)[name = tensor("x_165_cast_fp16")]; tensor var_1610 = const()[name = tensor("op_1610"), val = tensor([1, 8, -1, 3])]; tensor x_167_cast_fp16 = reshape(shape = var_1610, x = x_165_cast_fp16)[name = tensor("x_167_cast_fp16")]; tensor var_1614_begin_0 = const()[name = tensor("op_1614_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_1614_end_0 = const()[name = tensor("op_1614_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_1614_end_mask_0 = const()[name = tensor("op_1614_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_1614_cast_fp16 = slice_by_index(begin = var_1614_begin_0, end = var_1614_end_0, end_mask = var_1614_end_mask_0, x = x_167_cast_fp16)[name = tensor("op_1614_cast_fp16")]; tensor var_1615 = const()[name = tensor("op_1615"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_25_cast_fp16 = reshape(shape = var_1615, x = var_1614_cast_fp16)[name = tensor("matrix_bd_25_cast_fp16")]; tensor matrix_ac_13_transpose_x_0 = const()[name = tensor("matrix_ac_13_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_13_transpose_y_0 = const()[name = tensor("matrix_ac_13_transpose_y_0"), val = tensor(false)]; tensor transpose_63_perm_0 = const()[name = tensor("transpose_63_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_64_perm_0 = const()[name = tensor("transpose_64_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_64 = transpose(perm = transpose_64_perm_0, x = k_25_cast_fp16)[name = tensor("transpose_181")]; tensor transpose_63 = transpose(perm = transpose_63_perm_0, x = var_1598_cast_fp16)[name = tensor("transpose_182")]; tensor matrix_ac_13_cast_fp16 = matmul(transpose_x = matrix_ac_13_transpose_x_0, transpose_y = matrix_ac_13_transpose_y_0, x = transpose_63, y = transpose_64)[name = tensor("matrix_ac_13_cast_fp16")]; tensor matrix_bd_27_begin_0 = const()[name = tensor("matrix_bd_27_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_27_end_0 = const()[name = tensor("matrix_bd_27_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_27_end_mask_0 = const()[name = tensor("matrix_bd_27_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_27_cast_fp16 = slice_by_index(begin = matrix_bd_27_begin_0, end = matrix_bd_27_end_0, end_mask = matrix_bd_27_end_mask_0, x = matrix_bd_25_cast_fp16)[name = tensor("matrix_bd_27_cast_fp16")]; tensor var_1624_cast_fp16 = add(x = matrix_ac_13_cast_fp16, y = matrix_bd_27_cast_fp16)[name = tensor("op_1624_cast_fp16")]; tensor _inversed_scores_25_y_0_to_fp16 = const()[name = tensor("_inversed_scores_25_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_25_cast_fp16 = mul(x = var_1624_cast_fp16, y = _inversed_scores_25_y_0_to_fp16)[name = tensor("_inversed_scores_25_cast_fp16")]; tensor scores_27_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_25_cast_fp16, cond = mask_3)[name = tensor("scores_27_cast_fp16")]; tensor var_1630_cast_fp16 = softmax(axis = var_62, x = scores_27_cast_fp16)[name = tensor("op_1630_cast_fp16")]; tensor input_353_cast_fp16 = select(a = var_40_to_fp16, b = var_1630_cast_fp16, cond = mask_3)[name = tensor("input_353_cast_fp16")]; tensor x_169_transpose_x_0 = const()[name = tensor("x_169_transpose_x_0"), val = tensor(false)]; tensor x_169_transpose_y_0 = const()[name = tensor("x_169_transpose_y_0"), val = tensor(false)]; tensor value_15_cast_fp16 = transpose(perm = value_15_perm_0, x = v_13_cast_fp16)[name = tensor("transpose_184")]; tensor x_169_cast_fp16 = matmul(transpose_x = x_169_transpose_x_0, transpose_y = x_169_transpose_y_0, x = input_353_cast_fp16, y = value_15_cast_fp16)[name = tensor("x_169_cast_fp16")]; tensor var_1634_perm_0 = const()[name = tensor("op_1634_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1635 = const()[name = tensor("op_1635"), val = tensor([1, -1, 512])]; tensor var_1634_cast_fp16 = transpose(perm = var_1634_perm_0, x = x_169_cast_fp16)[name = tensor("transpose_180")]; tensor input_355_cast_fp16 = reshape(shape = var_1635, x = var_1634_cast_fp16)[name = tensor("input_355_cast_fp16")]; tensor encoder_layers_6_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_6_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(84058816)))]; tensor linear_61_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_6_self_attn_linear_out_weight_to_fp16, x = input_355_cast_fp16)[name = tensor("linear_61_cast_fp16")]; tensor input_359_cast_fp16 = add(x = input_349_cast_fp16, y = linear_61_cast_fp16)[name = tensor("input_359_cast_fp16")]; tensor x_173_axes_0 = const()[name = tensor("x_173_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_6_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(84583168)))]; tensor encoder_layers_6_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_6_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(84584256)))]; tensor x_173_cast_fp16 = layer_norm(axes = x_173_axes_0, beta = encoder_layers_6_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_6_norm_conv_weight_to_fp16, x = input_359_cast_fp16)[name = tensor("x_173_cast_fp16")]; tensor input_361_perm_0 = const()[name = tensor("input_361_perm_0"), val = tensor([0, 2, 1])]; tensor input_363_pad_type_0 = const()[name = tensor("input_363_pad_type_0"), val = tensor("valid")]; tensor input_363_strides_0 = const()[name = tensor("input_363_strides_0"), val = tensor([1])]; tensor input_363_pad_0 = const()[name = tensor("input_363_pad_0"), val = tensor([0, 0])]; tensor input_363_dilations_0 = const()[name = tensor("input_363_dilations_0"), val = tensor([1])]; tensor input_363_groups_0 = const()[name = tensor("input_363_groups_0"), val = tensor(1)]; tensor encoder_layers_6_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_6_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(84585344)))]; tensor input_361_cast_fp16 = transpose(perm = input_361_perm_0, x = x_173_cast_fp16)[name = tensor("transpose_179")]; tensor input_363_cast_fp16 = conv(dilations = input_363_dilations_0, groups = input_363_groups_0, pad = input_363_pad_0, pad_type = input_363_pad_type_0, strides = input_363_strides_0, weight = encoder_layers_6_conv_pointwise_conv1_weight_to_fp16, x = input_361_cast_fp16)[name = tensor("input_363_cast_fp16")]; tensor x_175_split_num_splits_0 = const()[name = tensor("x_175_split_num_splits_0"), val = tensor(2)]; tensor x_175_split_axis_0 = const()[name = tensor("x_175_split_axis_0"), val = tensor(1)]; tensor x_175_split_cast_fp16_0, tensor x_175_split_cast_fp16_1 = split(axis = x_175_split_axis_0, num_splits = x_175_split_num_splits_0, x = input_363_cast_fp16)[name = tensor("x_175_split_cast_fp16")]; tensor x_175_split_1_sigmoid_cast_fp16 = sigmoid(x = x_175_split_cast_fp16_1)[name = tensor("x_175_split_1_sigmoid_cast_fp16")]; tensor x_175_cast_fp16 = mul(x = x_175_split_cast_fp16_0, y = x_175_split_1_sigmoid_cast_fp16)[name = tensor("x_175_cast_fp16")]; tensor input_365_cast_fp16 = select(a = var_40_to_fp16, b = x_175_cast_fp16, cond = var_418)[name = tensor("input_365_cast_fp16")]; tensor new_x_27_interleave_0 = const()[name = tensor("new_x_27_interleave_0"), val = tensor(false)]; tensor new_x_27_cast_fp16 = concat(axis = var_62, interleave = new_x_27_interleave_0, values = (cache_27_cast_fp16, input_365_cast_fp16))[name = tensor("new_x_27_cast_fp16")]; tensor next_cache_13_begin_0 = const()[name = tensor("next_cache_13_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_13_end_0 = const()[name = tensor("next_cache_13_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_13_end_mask_0 = const()[name = tensor("next_cache_13_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_13_cast_fp16 = slice_by_index(begin = next_cache_13_begin_0, end = next_cache_13_end_0, end_mask = next_cache_13_end_mask_0, x = new_x_27_cast_fp16)[name = tensor("next_cache_13_cast_fp16")]; tensor var_1676_begin_0 = const()[name = tensor("op_1676_begin_0"), val = tensor([0, 0, 1])]; tensor var_1676_end_0 = const()[name = tensor("op_1676_end_0"), val = tensor([1, 512, 9])]; tensor var_1676_end_mask_0 = const()[name = tensor("op_1676_end_mask_0"), val = tensor([true, true, true])]; tensor var_1676_cast_fp16 = slice_by_index(begin = var_1676_begin_0, end = var_1676_end_0, end_mask = var_1676_end_mask_0, x = next_cache_13_cast_fp16)[name = tensor("op_1676_cast_fp16")]; tensor x_177_pad_type_0 = const()[name = tensor("x_177_pad_type_0"), val = tensor("valid")]; tensor x_177_groups_0 = const()[name = tensor("x_177_groups_0"), val = tensor(512)]; tensor x_177_strides_0 = const()[name = tensor("x_177_strides_0"), val = tensor([1])]; tensor x_177_pad_0 = const()[name = tensor("x_177_pad_0"), val = tensor([0, 0])]; tensor x_177_dilations_0 = const()[name = tensor("x_177_dilations_0"), val = tensor([1])]; tensor encoder_layers_6_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_6_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85633984)))]; tensor x_177_cast_fp16 = conv(dilations = x_177_dilations_0, groups = x_177_groups_0, pad = x_177_pad_0, pad_type = x_177_pad_type_0, strides = x_177_strides_0, weight = encoder_layers_6_conv_depthwise_conv_weight_to_fp16, x = new_x_27_cast_fp16)[name = tensor("x_177_cast_fp16")]; tensor input_367_perm_0 = const()[name = tensor("input_367_perm_0"), val = tensor([0, 2, 1])]; tensor x_179_axes_0 = const()[name = tensor("x_179_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_6_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85643264)))]; tensor encoder_layers_6_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_6_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85644352)))]; tensor input_367_cast_fp16 = transpose(perm = input_367_perm_0, x = x_177_cast_fp16)[name = tensor("transpose_178")]; tensor x_179_cast_fp16 = layer_norm(axes = x_179_axes_0, beta = encoder_layers_6_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_6_conv_batch_norm_weight_to_fp16, x = input_367_cast_fp16)[name = tensor("x_179_cast_fp16")]; tensor input_369_perm_0 = const()[name = tensor("input_369_perm_0"), val = tensor([0, 2, 1])]; tensor input_369_cast_fp16 = transpose(perm = input_369_perm_0, x = x_179_cast_fp16)[name = tensor("transpose_177")]; tensor input_371_cast_fp16 = silu(x = input_369_cast_fp16)[name = tensor("input_371_cast_fp16")]; tensor x_181_pad_type_0 = const()[name = tensor("x_181_pad_type_0"), val = tensor("valid")]; tensor x_181_strides_0 = const()[name = tensor("x_181_strides_0"), val = tensor([1])]; tensor x_181_pad_0 = const()[name = tensor("x_181_pad_0"), val = tensor([0, 0])]; tensor x_181_dilations_0 = const()[name = tensor("x_181_dilations_0"), val = tensor([1])]; tensor x_181_groups_0 = const()[name = tensor("x_181_groups_0"), val = tensor(1)]; tensor encoder_layers_6_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_6_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85645440)))]; tensor x_181_cast_fp16 = conv(dilations = x_181_dilations_0, groups = x_181_groups_0, pad = x_181_pad_0, pad_type = x_181_pad_type_0, strides = x_181_strides_0, weight = encoder_layers_6_conv_pointwise_conv2_weight_to_fp16, x = input_371_cast_fp16)[name = tensor("x_181_cast_fp16")]; tensor input_373_perm_0 = const()[name = tensor("input_373_perm_0"), val = tensor([0, 2, 1])]; tensor input_373_cast_fp16 = transpose(perm = input_373_perm_0, x = x_181_cast_fp16)[name = tensor("transpose_176")]; tensor input_375_cast_fp16 = add(x = input_359_cast_fp16, y = input_373_cast_fp16)[name = tensor("input_375_cast_fp16")]; tensor input_377_axes_0 = const()[name = tensor("input_377_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_6_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(86169792)))]; tensor encoder_layers_6_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_6_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(86170880)))]; tensor input_377_cast_fp16 = layer_norm(axes = input_377_axes_0, beta = encoder_layers_6_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_6_norm_feed_forward2_weight_to_fp16, x = input_375_cast_fp16)[name = tensor("input_377_cast_fp16")]; tensor encoder_layers_6_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_6_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(86171968)))]; tensor linear_62_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_6_feed_forward2_linear1_weight_to_fp16, x = input_377_cast_fp16)[name = tensor("linear_62_cast_fp16")]; tensor input_381_cast_fp16 = silu(x = linear_62_cast_fp16)[name = tensor("input_381_cast_fp16")]; tensor encoder_layers_6_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_6_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(88269184)))]; tensor linear_63_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_6_feed_forward2_linear2_weight_to_fp16, x = input_381_cast_fp16)[name = tensor("linear_63_cast_fp16")]; tensor var_1717_to_fp16 = const()[name = tensor("op_1717_to_fp16"), val = tensor(0x1p-1)]; tensor var_1718_cast_fp16 = mul(x = linear_63_cast_fp16, y = var_1717_to_fp16)[name = tensor("op_1718_cast_fp16")]; tensor input_387_cast_fp16 = add(x = input_375_cast_fp16, y = var_1718_cast_fp16)[name = tensor("input_387_cast_fp16")]; tensor input_389_axes_0 = const()[name = tensor("input_389_axes_0"), val = tensor([-1])]; tensor encoder_layers_6_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_6_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(90366400)))]; tensor encoder_layers_6_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_6_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(90367488)))]; tensor input_389_cast_fp16 = layer_norm(axes = input_389_axes_0, beta = encoder_layers_6_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_6_norm_out_weight_to_fp16, x = input_387_cast_fp16)[name = tensor("input_389_cast_fp16")]; tensor cache_29_begin_0 = const()[name = tensor("cache_29_begin_0"), val = tensor([7, 0, 0, 0])]; tensor cache_29_end_0 = const()[name = tensor("cache_29_end_0"), val = tensor([8, 1, 70, 512])]; tensor cache_29_end_mask_0 = const()[name = tensor("cache_29_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_29_squeeze_mask_0 = const()[name = tensor("cache_29_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_29_cast_fp16 = slice_by_index(begin = cache_29_begin_0, end = cache_29_end_0, end_mask = cache_29_end_mask_0, squeeze_mask = cache_29_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_29_cast_fp16")]; tensor cache_31_begin_0 = const()[name = tensor("cache_31_begin_0"), val = tensor([7, 0, 0, 0])]; tensor cache_31_end_0 = const()[name = tensor("cache_31_end_0"), val = tensor([8, 1, 512, 8])]; tensor cache_31_end_mask_0 = const()[name = tensor("cache_31_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_31_squeeze_mask_0 = const()[name = tensor("cache_31_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_31_cast_fp16 = slice_by_index(begin = cache_31_begin_0, end = cache_31_end_0, end_mask = cache_31_end_mask_0, squeeze_mask = cache_31_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_31_cast_fp16")]; tensor input_391_axes_0 = const()[name = tensor("input_391_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_7_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(90368576)))]; tensor encoder_layers_7_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_7_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(90369664)))]; tensor input_391_cast_fp16 = layer_norm(axes = input_391_axes_0, beta = encoder_layers_7_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_7_norm_feed_forward1_weight_to_fp16, x = input_389_cast_fp16)[name = tensor("input_391_cast_fp16")]; tensor encoder_layers_7_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_7_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(90370752)))]; tensor linear_64_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_7_feed_forward1_linear1_weight_to_fp16, x = input_391_cast_fp16)[name = tensor("linear_64_cast_fp16")]; tensor input_395_cast_fp16 = silu(x = linear_64_cast_fp16)[name = tensor("input_395_cast_fp16")]; tensor encoder_layers_7_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_7_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(92467968)))]; tensor linear_65_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_7_feed_forward1_linear2_weight_to_fp16, x = input_395_cast_fp16)[name = tensor("linear_65_cast_fp16")]; tensor var_1752_to_fp16 = const()[name = tensor("op_1752_to_fp16"), val = tensor(0x1p-1)]; tensor var_1753_cast_fp16 = mul(x = linear_65_cast_fp16, y = var_1752_to_fp16)[name = tensor("op_1753_cast_fp16")]; tensor input_401_cast_fp16 = add(x = input_389_cast_fp16, y = var_1753_cast_fp16)[name = tensor("input_401_cast_fp16")]; tensor key_15_axes_0 = const()[name = tensor("key_15_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_7_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94565184)))]; tensor encoder_layers_7_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_7_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94566272)))]; tensor key_15_cast_fp16 = layer_norm(axes = key_15_axes_0, beta = encoder_layers_7_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_7_norm_self_att_weight_to_fp16, x = input_401_cast_fp16)[name = tensor("key_15_cast_fp16")]; tensor input_403_interleave_0 = const()[name = tensor("input_403_interleave_0"), val = tensor(false)]; tensor input_403_cast_fp16 = concat(axis = var_64, interleave = input_403_interleave_0, values = (cache_29_cast_fp16, key_15_cast_fp16))[name = tensor("input_403_cast_fp16")]; tensor var_1775_begin_0 = const()[name = tensor("op_1775_begin_0"), val = tensor([0, 1, 0])]; tensor var_1775_end_0 = const()[name = tensor("op_1775_end_0"), val = tensor([1, 70, 512])]; tensor var_1775_end_mask_0 = const()[name = tensor("op_1775_end_mask_0"), val = tensor([true, true, true])]; tensor var_1775_cast_fp16 = slice_by_index(begin = var_1775_begin_0, end = var_1775_end_0, end_mask = var_1775_end_mask_0, x = cache_29_cast_fp16)[name = tensor("op_1775_cast_fp16")]; tensor var_1778_begin_0 = const()[name = tensor("op_1778_begin_0"), val = tensor([0, 0, 0])]; tensor var_1778_end_0 = const()[name = tensor("op_1778_end_0"), val = tensor([1, 1, 512])]; tensor var_1778_end_mask_0 = const()[name = tensor("op_1778_end_mask_0"), val = tensor([true, false, true])]; tensor var_1778_cast_fp16 = slice_by_index(begin = var_1778_begin_0, end = var_1778_end_0, end_mask = var_1778_end_mask_0, x = key_15_cast_fp16)[name = tensor("op_1778_cast_fp16")]; tensor var_1781_interleave_0 = const()[name = tensor("op_1781_interleave_0"), val = tensor(false)]; tensor var_1781_cast_fp16 = concat(axis = var_64, interleave = var_1781_interleave_0, values = (var_1775_cast_fp16, var_1778_cast_fp16))[name = tensor("op_1781_cast_fp16")]; tensor encoder_layers_7_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(94567360)))]; tensor linear_66_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_7_self_attn_linear_q_weight_to_fp16, x = key_15_cast_fp16)[name = tensor("linear_66_cast_fp16")]; tensor var_1785 = const()[name = tensor("op_1785"), val = tensor([1, -1, 8, 64])]; tensor q_43_cast_fp16 = reshape(shape = var_1785, x = linear_66_cast_fp16)[name = tensor("q_43_cast_fp16")]; tensor encoder_layers_7_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(95091712)))]; tensor linear_67_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_7_self_attn_linear_k_weight_to_fp16, x = input_403_cast_fp16)[name = tensor("linear_67_cast_fp16")]; tensor var_1789 = const()[name = tensor("op_1789"), val = tensor([1, -1, 8, 64])]; tensor k_29_cast_fp16 = reshape(shape = var_1789, x = linear_67_cast_fp16)[name = tensor("k_29_cast_fp16")]; tensor encoder_layers_7_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(95616064)))]; tensor linear_68_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_7_self_attn_linear_v_weight_to_fp16, x = input_403_cast_fp16)[name = tensor("linear_68_cast_fp16")]; tensor var_1793 = const()[name = tensor("op_1793"), val = tensor([1, -1, 8, 64])]; tensor v_15_cast_fp16 = reshape(shape = var_1793, x = linear_68_cast_fp16)[name = tensor("v_15_cast_fp16")]; tensor value_17_perm_0 = const()[name = tensor("value_17_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_7_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(96140416)))]; tensor var_1805_cast_fp16 = add(x = q_43_cast_fp16, y = encoder_layers_7_self_attn_pos_bias_u_to_fp16)[name = tensor("op_1805_cast_fp16")]; tensor encoder_layers_7_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(96141504)))]; tensor var_1807_cast_fp16 = add(x = q_43_cast_fp16, y = encoder_layers_7_self_attn_pos_bias_v_to_fp16)[name = tensor("op_1807_cast_fp16")]; tensor q_with_bias_v_15_perm_0 = const()[name = tensor("q_with_bias_v_15_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_189_transpose_x_0 = const()[name = tensor("x_189_transpose_x_0"), val = tensor(false)]; tensor x_189_transpose_y_0 = const()[name = tensor("x_189_transpose_y_0"), val = tensor(false)]; tensor var_1809_to_fp16 = const()[name = tensor("op_1809_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(96142592)))]; tensor q_with_bias_v_15_cast_fp16 = transpose(perm = q_with_bias_v_15_perm_0, x = var_1807_cast_fp16)[name = tensor("transpose_174")]; tensor x_189_cast_fp16 = matmul(transpose_x = x_189_transpose_x_0, transpose_y = x_189_transpose_y_0, x = q_with_bias_v_15_cast_fp16, y = var_1809_to_fp16)[name = tensor("x_189_cast_fp16")]; tensor x_191_pad_0 = const()[name = tensor("x_191_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_191_mode_0 = const()[name = tensor("x_191_mode_0"), val = tensor("constant")]; tensor const_114_to_fp16 = const()[name = tensor("const_114_to_fp16"), val = tensor(0x0p+0)]; tensor x_191_cast_fp16 = pad(constant_val = const_114_to_fp16, mode = x_191_mode_0, pad = x_191_pad_0, x = x_189_cast_fp16)[name = tensor("x_191_cast_fp16")]; tensor var_1817 = const()[name = tensor("op_1817"), val = tensor([1, 8, -1, 3])]; tensor x_193_cast_fp16 = reshape(shape = var_1817, x = x_191_cast_fp16)[name = tensor("x_193_cast_fp16")]; tensor var_1821_begin_0 = const()[name = tensor("op_1821_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_1821_end_0 = const()[name = tensor("op_1821_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_1821_end_mask_0 = const()[name = tensor("op_1821_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_1821_cast_fp16 = slice_by_index(begin = var_1821_begin_0, end = var_1821_end_0, end_mask = var_1821_end_mask_0, x = x_193_cast_fp16)[name = tensor("op_1821_cast_fp16")]; tensor var_1822 = const()[name = tensor("op_1822"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_29_cast_fp16 = reshape(shape = var_1822, x = var_1821_cast_fp16)[name = tensor("matrix_bd_29_cast_fp16")]; tensor matrix_ac_15_transpose_x_0 = const()[name = tensor("matrix_ac_15_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_15_transpose_y_0 = const()[name = tensor("matrix_ac_15_transpose_y_0"), val = tensor(false)]; tensor transpose_65_perm_0 = const()[name = tensor("transpose_65_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_66_perm_0 = const()[name = tensor("transpose_66_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_66 = transpose(perm = transpose_66_perm_0, x = k_29_cast_fp16)[name = tensor("transpose_172")]; tensor transpose_65 = transpose(perm = transpose_65_perm_0, x = var_1805_cast_fp16)[name = tensor("transpose_173")]; tensor matrix_ac_15_cast_fp16 = matmul(transpose_x = matrix_ac_15_transpose_x_0, transpose_y = matrix_ac_15_transpose_y_0, x = transpose_65, y = transpose_66)[name = tensor("matrix_ac_15_cast_fp16")]; tensor matrix_bd_31_begin_0 = const()[name = tensor("matrix_bd_31_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_31_end_0 = const()[name = tensor("matrix_bd_31_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_31_end_mask_0 = const()[name = tensor("matrix_bd_31_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_31_cast_fp16 = slice_by_index(begin = matrix_bd_31_begin_0, end = matrix_bd_31_end_0, end_mask = matrix_bd_31_end_mask_0, x = matrix_bd_29_cast_fp16)[name = tensor("matrix_bd_31_cast_fp16")]; tensor var_1831_cast_fp16 = add(x = matrix_ac_15_cast_fp16, y = matrix_bd_31_cast_fp16)[name = tensor("op_1831_cast_fp16")]; tensor _inversed_scores_29_y_0_to_fp16 = const()[name = tensor("_inversed_scores_29_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_29_cast_fp16 = mul(x = var_1831_cast_fp16, y = _inversed_scores_29_y_0_to_fp16)[name = tensor("_inversed_scores_29_cast_fp16")]; tensor scores_31_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_29_cast_fp16, cond = mask_3)[name = tensor("scores_31_cast_fp16")]; tensor var_1837_cast_fp16 = softmax(axis = var_62, x = scores_31_cast_fp16)[name = tensor("op_1837_cast_fp16")]; tensor input_405_cast_fp16 = select(a = var_40_to_fp16, b = var_1837_cast_fp16, cond = mask_3)[name = tensor("input_405_cast_fp16")]; tensor x_195_transpose_x_0 = const()[name = tensor("x_195_transpose_x_0"), val = tensor(false)]; tensor x_195_transpose_y_0 = const()[name = tensor("x_195_transpose_y_0"), val = tensor(false)]; tensor value_17_cast_fp16 = transpose(perm = value_17_perm_0, x = v_15_cast_fp16)[name = tensor("transpose_175")]; tensor x_195_cast_fp16 = matmul(transpose_x = x_195_transpose_x_0, transpose_y = x_195_transpose_y_0, x = input_405_cast_fp16, y = value_17_cast_fp16)[name = tensor("x_195_cast_fp16")]; tensor var_1841_perm_0 = const()[name = tensor("op_1841_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_1842 = const()[name = tensor("op_1842"), val = tensor([1, -1, 512])]; tensor var_1841_cast_fp16 = transpose(perm = var_1841_perm_0, x = x_195_cast_fp16)[name = tensor("transpose_171")]; tensor input_407_cast_fp16 = reshape(shape = var_1842, x = var_1841_cast_fp16)[name = tensor("input_407_cast_fp16")]; tensor encoder_layers_7_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_7_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(96291136)))]; tensor linear_70_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_7_self_attn_linear_out_weight_to_fp16, x = input_407_cast_fp16)[name = tensor("linear_70_cast_fp16")]; tensor input_411_cast_fp16 = add(x = input_401_cast_fp16, y = linear_70_cast_fp16)[name = tensor("input_411_cast_fp16")]; tensor x_199_axes_0 = const()[name = tensor("x_199_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_7_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(96815488)))]; tensor encoder_layers_7_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_7_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(96816576)))]; tensor x_199_cast_fp16 = layer_norm(axes = x_199_axes_0, beta = encoder_layers_7_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_7_norm_conv_weight_to_fp16, x = input_411_cast_fp16)[name = tensor("x_199_cast_fp16")]; tensor input_413_perm_0 = const()[name = tensor("input_413_perm_0"), val = tensor([0, 2, 1])]; tensor input_415_pad_type_0 = const()[name = tensor("input_415_pad_type_0"), val = tensor("valid")]; tensor input_415_strides_0 = const()[name = tensor("input_415_strides_0"), val = tensor([1])]; tensor input_415_pad_0 = const()[name = tensor("input_415_pad_0"), val = tensor([0, 0])]; tensor input_415_dilations_0 = const()[name = tensor("input_415_dilations_0"), val = tensor([1])]; tensor input_415_groups_0 = const()[name = tensor("input_415_groups_0"), val = tensor(1)]; tensor encoder_layers_7_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_7_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(96817664)))]; tensor input_413_cast_fp16 = transpose(perm = input_413_perm_0, x = x_199_cast_fp16)[name = tensor("transpose_170")]; tensor input_415_cast_fp16 = conv(dilations = input_415_dilations_0, groups = input_415_groups_0, pad = input_415_pad_0, pad_type = input_415_pad_type_0, strides = input_415_strides_0, weight = encoder_layers_7_conv_pointwise_conv1_weight_to_fp16, x = input_413_cast_fp16)[name = tensor("input_415_cast_fp16")]; tensor x_201_split_num_splits_0 = const()[name = tensor("x_201_split_num_splits_0"), val = tensor(2)]; tensor x_201_split_axis_0 = const()[name = tensor("x_201_split_axis_0"), val = tensor(1)]; tensor x_201_split_cast_fp16_0, tensor x_201_split_cast_fp16_1 = split(axis = x_201_split_axis_0, num_splits = x_201_split_num_splits_0, x = input_415_cast_fp16)[name = tensor("x_201_split_cast_fp16")]; tensor x_201_split_1_sigmoid_cast_fp16 = sigmoid(x = x_201_split_cast_fp16_1)[name = tensor("x_201_split_1_sigmoid_cast_fp16")]; tensor x_201_cast_fp16 = mul(x = x_201_split_cast_fp16_0, y = x_201_split_1_sigmoid_cast_fp16)[name = tensor("x_201_cast_fp16")]; tensor input_417_cast_fp16 = select(a = var_40_to_fp16, b = x_201_cast_fp16, cond = var_418)[name = tensor("input_417_cast_fp16")]; tensor new_x_31_interleave_0 = const()[name = tensor("new_x_31_interleave_0"), val = tensor(false)]; tensor new_x_31_cast_fp16 = concat(axis = var_62, interleave = new_x_31_interleave_0, values = (cache_31_cast_fp16, input_417_cast_fp16))[name = tensor("new_x_31_cast_fp16")]; tensor next_cache_15_begin_0 = const()[name = tensor("next_cache_15_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_15_end_0 = const()[name = tensor("next_cache_15_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_15_end_mask_0 = const()[name = tensor("next_cache_15_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_15_cast_fp16 = slice_by_index(begin = next_cache_15_begin_0, end = next_cache_15_end_0, end_mask = next_cache_15_end_mask_0, x = new_x_31_cast_fp16)[name = tensor("next_cache_15_cast_fp16")]; tensor var_1883_begin_0 = const()[name = tensor("op_1883_begin_0"), val = tensor([0, 0, 1])]; tensor var_1883_end_0 = const()[name = tensor("op_1883_end_0"), val = tensor([1, 512, 9])]; tensor var_1883_end_mask_0 = const()[name = tensor("op_1883_end_mask_0"), val = tensor([true, true, true])]; tensor var_1883_cast_fp16 = slice_by_index(begin = var_1883_begin_0, end = var_1883_end_0, end_mask = var_1883_end_mask_0, x = next_cache_15_cast_fp16)[name = tensor("op_1883_cast_fp16")]; tensor x_203_pad_type_0 = const()[name = tensor("x_203_pad_type_0"), val = tensor("valid")]; tensor x_203_groups_0 = const()[name = tensor("x_203_groups_0"), val = tensor(512)]; tensor x_203_strides_0 = const()[name = tensor("x_203_strides_0"), val = tensor([1])]; tensor x_203_pad_0 = const()[name = tensor("x_203_pad_0"), val = tensor([0, 0])]; tensor x_203_dilations_0 = const()[name = tensor("x_203_dilations_0"), val = tensor([1])]; tensor encoder_layers_7_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_7_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(97866304)))]; tensor x_203_cast_fp16 = conv(dilations = x_203_dilations_0, groups = x_203_groups_0, pad = x_203_pad_0, pad_type = x_203_pad_type_0, strides = x_203_strides_0, weight = encoder_layers_7_conv_depthwise_conv_weight_to_fp16, x = new_x_31_cast_fp16)[name = tensor("x_203_cast_fp16")]; tensor input_419_perm_0 = const()[name = tensor("input_419_perm_0"), val = tensor([0, 2, 1])]; tensor x_205_axes_0 = const()[name = tensor("x_205_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_7_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(97875584)))]; tensor encoder_layers_7_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_7_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(97876672)))]; tensor input_419_cast_fp16 = transpose(perm = input_419_perm_0, x = x_203_cast_fp16)[name = tensor("transpose_169")]; tensor x_205_cast_fp16 = layer_norm(axes = x_205_axes_0, beta = encoder_layers_7_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_7_conv_batch_norm_weight_to_fp16, x = input_419_cast_fp16)[name = tensor("x_205_cast_fp16")]; tensor input_421_perm_0 = const()[name = tensor("input_421_perm_0"), val = tensor([0, 2, 1])]; tensor input_421_cast_fp16 = transpose(perm = input_421_perm_0, x = x_205_cast_fp16)[name = tensor("transpose_168")]; tensor input_423_cast_fp16 = silu(x = input_421_cast_fp16)[name = tensor("input_423_cast_fp16")]; tensor x_207_pad_type_0 = const()[name = tensor("x_207_pad_type_0"), val = tensor("valid")]; tensor x_207_strides_0 = const()[name = tensor("x_207_strides_0"), val = tensor([1])]; tensor x_207_pad_0 = const()[name = tensor("x_207_pad_0"), val = tensor([0, 0])]; tensor x_207_dilations_0 = const()[name = tensor("x_207_dilations_0"), val = tensor([1])]; tensor x_207_groups_0 = const()[name = tensor("x_207_groups_0"), val = tensor(1)]; tensor encoder_layers_7_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_7_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(97877760)))]; tensor x_207_cast_fp16 = conv(dilations = x_207_dilations_0, groups = x_207_groups_0, pad = x_207_pad_0, pad_type = x_207_pad_type_0, strides = x_207_strides_0, weight = encoder_layers_7_conv_pointwise_conv2_weight_to_fp16, x = input_423_cast_fp16)[name = tensor("x_207_cast_fp16")]; tensor input_425_perm_0 = const()[name = tensor("input_425_perm_0"), val = tensor([0, 2, 1])]; tensor input_425_cast_fp16 = transpose(perm = input_425_perm_0, x = x_207_cast_fp16)[name = tensor("transpose_167")]; tensor input_427_cast_fp16 = add(x = input_411_cast_fp16, y = input_425_cast_fp16)[name = tensor("input_427_cast_fp16")]; tensor input_429_axes_0 = const()[name = tensor("input_429_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_7_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(98402112)))]; tensor encoder_layers_7_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_7_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(98403200)))]; tensor input_429_cast_fp16 = layer_norm(axes = input_429_axes_0, beta = encoder_layers_7_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_7_norm_feed_forward2_weight_to_fp16, x = input_427_cast_fp16)[name = tensor("input_429_cast_fp16")]; tensor encoder_layers_7_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_7_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(98404288)))]; tensor linear_71_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_7_feed_forward2_linear1_weight_to_fp16, x = input_429_cast_fp16)[name = tensor("linear_71_cast_fp16")]; tensor input_433_cast_fp16 = silu(x = linear_71_cast_fp16)[name = tensor("input_433_cast_fp16")]; tensor encoder_layers_7_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_7_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100501504)))]; tensor linear_72_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_7_feed_forward2_linear2_weight_to_fp16, x = input_433_cast_fp16)[name = tensor("linear_72_cast_fp16")]; tensor var_1924_to_fp16 = const()[name = tensor("op_1924_to_fp16"), val = tensor(0x1p-1)]; tensor var_1925_cast_fp16 = mul(x = linear_72_cast_fp16, y = var_1924_to_fp16)[name = tensor("op_1925_cast_fp16")]; tensor input_439_cast_fp16 = add(x = input_427_cast_fp16, y = var_1925_cast_fp16)[name = tensor("input_439_cast_fp16")]; tensor input_441_axes_0 = const()[name = tensor("input_441_axes_0"), val = tensor([-1])]; tensor encoder_layers_7_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_7_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102598720)))]; tensor encoder_layers_7_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_7_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102599808)))]; tensor input_441_cast_fp16 = layer_norm(axes = input_441_axes_0, beta = encoder_layers_7_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_7_norm_out_weight_to_fp16, x = input_439_cast_fp16)[name = tensor("input_441_cast_fp16")]; tensor cache_33_begin_0 = const()[name = tensor("cache_33_begin_0"), val = tensor([8, 0, 0, 0])]; tensor cache_33_end_0 = const()[name = tensor("cache_33_end_0"), val = tensor([9, 1, 70, 512])]; tensor cache_33_end_mask_0 = const()[name = tensor("cache_33_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_33_squeeze_mask_0 = const()[name = tensor("cache_33_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_33_cast_fp16 = slice_by_index(begin = cache_33_begin_0, end = cache_33_end_0, end_mask = cache_33_end_mask_0, squeeze_mask = cache_33_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_33_cast_fp16")]; tensor cache_35_begin_0 = const()[name = tensor("cache_35_begin_0"), val = tensor([8, 0, 0, 0])]; tensor cache_35_end_0 = const()[name = tensor("cache_35_end_0"), val = tensor([9, 1, 512, 8])]; tensor cache_35_end_mask_0 = const()[name = tensor("cache_35_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_35_squeeze_mask_0 = const()[name = tensor("cache_35_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_35_cast_fp16 = slice_by_index(begin = cache_35_begin_0, end = cache_35_end_0, end_mask = cache_35_end_mask_0, squeeze_mask = cache_35_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_35_cast_fp16")]; tensor input_443_axes_0 = const()[name = tensor("input_443_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_8_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102600896)))]; tensor encoder_layers_8_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_8_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102601984)))]; tensor input_443_cast_fp16 = layer_norm(axes = input_443_axes_0, beta = encoder_layers_8_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_8_norm_feed_forward1_weight_to_fp16, x = input_441_cast_fp16)[name = tensor("input_443_cast_fp16")]; tensor encoder_layers_8_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_8_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102603072)))]; tensor linear_73_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_8_feed_forward1_linear1_weight_to_fp16, x = input_443_cast_fp16)[name = tensor("linear_73_cast_fp16")]; tensor input_447_cast_fp16 = silu(x = linear_73_cast_fp16)[name = tensor("input_447_cast_fp16")]; tensor encoder_layers_8_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_8_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(104700288)))]; tensor linear_74_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_8_feed_forward1_linear2_weight_to_fp16, x = input_447_cast_fp16)[name = tensor("linear_74_cast_fp16")]; tensor var_1959_to_fp16 = const()[name = tensor("op_1959_to_fp16"), val = tensor(0x1p-1)]; tensor var_1960_cast_fp16 = mul(x = linear_74_cast_fp16, y = var_1959_to_fp16)[name = tensor("op_1960_cast_fp16")]; tensor input_453_cast_fp16 = add(x = input_441_cast_fp16, y = var_1960_cast_fp16)[name = tensor("input_453_cast_fp16")]; tensor key_17_axes_0 = const()[name = tensor("key_17_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_8_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106797504)))]; tensor encoder_layers_8_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_8_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106798592)))]; tensor key_17_cast_fp16 = layer_norm(axes = key_17_axes_0, beta = encoder_layers_8_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_8_norm_self_att_weight_to_fp16, x = input_453_cast_fp16)[name = tensor("key_17_cast_fp16")]; tensor input_455_interleave_0 = const()[name = tensor("input_455_interleave_0"), val = tensor(false)]; tensor input_455_cast_fp16 = concat(axis = var_64, interleave = input_455_interleave_0, values = (cache_33_cast_fp16, key_17_cast_fp16))[name = tensor("input_455_cast_fp16")]; tensor var_1982_begin_0 = const()[name = tensor("op_1982_begin_0"), val = tensor([0, 1, 0])]; tensor var_1982_end_0 = const()[name = tensor("op_1982_end_0"), val = tensor([1, 70, 512])]; tensor var_1982_end_mask_0 = const()[name = tensor("op_1982_end_mask_0"), val = tensor([true, true, true])]; tensor var_1982_cast_fp16 = slice_by_index(begin = var_1982_begin_0, end = var_1982_end_0, end_mask = var_1982_end_mask_0, x = cache_33_cast_fp16)[name = tensor("op_1982_cast_fp16")]; tensor var_1985_begin_0 = const()[name = tensor("op_1985_begin_0"), val = tensor([0, 0, 0])]; tensor var_1985_end_0 = const()[name = tensor("op_1985_end_0"), val = tensor([1, 1, 512])]; tensor var_1985_end_mask_0 = const()[name = tensor("op_1985_end_mask_0"), val = tensor([true, false, true])]; tensor var_1985_cast_fp16 = slice_by_index(begin = var_1985_begin_0, end = var_1985_end_0, end_mask = var_1985_end_mask_0, x = key_17_cast_fp16)[name = tensor("op_1985_cast_fp16")]; tensor var_1988_interleave_0 = const()[name = tensor("op_1988_interleave_0"), val = tensor(false)]; tensor var_1988_cast_fp16 = concat(axis = var_64, interleave = var_1988_interleave_0, values = (var_1982_cast_fp16, var_1985_cast_fp16))[name = tensor("op_1988_cast_fp16")]; tensor encoder_layers_8_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106799680)))]; tensor linear_75_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_8_self_attn_linear_q_weight_to_fp16, x = key_17_cast_fp16)[name = tensor("linear_75_cast_fp16")]; tensor var_1992 = const()[name = tensor("op_1992"), val = tensor([1, -1, 8, 64])]; tensor q_49_cast_fp16 = reshape(shape = var_1992, x = linear_75_cast_fp16)[name = tensor("q_49_cast_fp16")]; tensor encoder_layers_8_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(107324032)))]; tensor linear_76_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_8_self_attn_linear_k_weight_to_fp16, x = input_455_cast_fp16)[name = tensor("linear_76_cast_fp16")]; tensor var_1996 = const()[name = tensor("op_1996"), val = tensor([1, -1, 8, 64])]; tensor k_33_cast_fp16 = reshape(shape = var_1996, x = linear_76_cast_fp16)[name = tensor("k_33_cast_fp16")]; tensor encoder_layers_8_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(107848384)))]; tensor linear_77_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_8_self_attn_linear_v_weight_to_fp16, x = input_455_cast_fp16)[name = tensor("linear_77_cast_fp16")]; tensor var_2000 = const()[name = tensor("op_2000"), val = tensor([1, -1, 8, 64])]; tensor v_17_cast_fp16 = reshape(shape = var_2000, x = linear_77_cast_fp16)[name = tensor("v_17_cast_fp16")]; tensor value_19_perm_0 = const()[name = tensor("value_19_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_8_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(108372736)))]; tensor var_2012_cast_fp16 = add(x = q_49_cast_fp16, y = encoder_layers_8_self_attn_pos_bias_u_to_fp16)[name = tensor("op_2012_cast_fp16")]; tensor encoder_layers_8_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(108373824)))]; tensor var_2014_cast_fp16 = add(x = q_49_cast_fp16, y = encoder_layers_8_self_attn_pos_bias_v_to_fp16)[name = tensor("op_2014_cast_fp16")]; tensor q_with_bias_v_17_perm_0 = const()[name = tensor("q_with_bias_v_17_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_215_transpose_x_0 = const()[name = tensor("x_215_transpose_x_0"), val = tensor(false)]; tensor x_215_transpose_y_0 = const()[name = tensor("x_215_transpose_y_0"), val = tensor(false)]; tensor var_2016_to_fp16 = const()[name = tensor("op_2016_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(108374912)))]; tensor q_with_bias_v_17_cast_fp16 = transpose(perm = q_with_bias_v_17_perm_0, x = var_2014_cast_fp16)[name = tensor("transpose_165")]; tensor x_215_cast_fp16 = matmul(transpose_x = x_215_transpose_x_0, transpose_y = x_215_transpose_y_0, x = q_with_bias_v_17_cast_fp16, y = var_2016_to_fp16)[name = tensor("x_215_cast_fp16")]; tensor x_217_pad_0 = const()[name = tensor("x_217_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_217_mode_0 = const()[name = tensor("x_217_mode_0"), val = tensor("constant")]; tensor const_127_to_fp16 = const()[name = tensor("const_127_to_fp16"), val = tensor(0x0p+0)]; tensor x_217_cast_fp16 = pad(constant_val = const_127_to_fp16, mode = x_217_mode_0, pad = x_217_pad_0, x = x_215_cast_fp16)[name = tensor("x_217_cast_fp16")]; tensor var_2024 = const()[name = tensor("op_2024"), val = tensor([1, 8, -1, 3])]; tensor x_219_cast_fp16 = reshape(shape = var_2024, x = x_217_cast_fp16)[name = tensor("x_219_cast_fp16")]; tensor var_2028_begin_0 = const()[name = tensor("op_2028_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_2028_end_0 = const()[name = tensor("op_2028_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_2028_end_mask_0 = const()[name = tensor("op_2028_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_2028_cast_fp16 = slice_by_index(begin = var_2028_begin_0, end = var_2028_end_0, end_mask = var_2028_end_mask_0, x = x_219_cast_fp16)[name = tensor("op_2028_cast_fp16")]; tensor var_2029 = const()[name = tensor("op_2029"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_33_cast_fp16 = reshape(shape = var_2029, x = var_2028_cast_fp16)[name = tensor("matrix_bd_33_cast_fp16")]; tensor matrix_ac_17_transpose_x_0 = const()[name = tensor("matrix_ac_17_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_17_transpose_y_0 = const()[name = tensor("matrix_ac_17_transpose_y_0"), val = tensor(false)]; tensor transpose_67_perm_0 = const()[name = tensor("transpose_67_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_68_perm_0 = const()[name = tensor("transpose_68_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_68 = transpose(perm = transpose_68_perm_0, x = k_33_cast_fp16)[name = tensor("transpose_163")]; tensor transpose_67 = transpose(perm = transpose_67_perm_0, x = var_2012_cast_fp16)[name = tensor("transpose_164")]; tensor matrix_ac_17_cast_fp16 = matmul(transpose_x = matrix_ac_17_transpose_x_0, transpose_y = matrix_ac_17_transpose_y_0, x = transpose_67, y = transpose_68)[name = tensor("matrix_ac_17_cast_fp16")]; tensor matrix_bd_35_begin_0 = const()[name = tensor("matrix_bd_35_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_35_end_0 = const()[name = tensor("matrix_bd_35_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_35_end_mask_0 = const()[name = tensor("matrix_bd_35_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_35_cast_fp16 = slice_by_index(begin = matrix_bd_35_begin_0, end = matrix_bd_35_end_0, end_mask = matrix_bd_35_end_mask_0, x = matrix_bd_33_cast_fp16)[name = tensor("matrix_bd_35_cast_fp16")]; tensor var_2038_cast_fp16 = add(x = matrix_ac_17_cast_fp16, y = matrix_bd_35_cast_fp16)[name = tensor("op_2038_cast_fp16")]; tensor _inversed_scores_33_y_0_to_fp16 = const()[name = tensor("_inversed_scores_33_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_33_cast_fp16 = mul(x = var_2038_cast_fp16, y = _inversed_scores_33_y_0_to_fp16)[name = tensor("_inversed_scores_33_cast_fp16")]; tensor scores_35_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_33_cast_fp16, cond = mask_3)[name = tensor("scores_35_cast_fp16")]; tensor var_2044_cast_fp16 = softmax(axis = var_62, x = scores_35_cast_fp16)[name = tensor("op_2044_cast_fp16")]; tensor input_457_cast_fp16 = select(a = var_40_to_fp16, b = var_2044_cast_fp16, cond = mask_3)[name = tensor("input_457_cast_fp16")]; tensor x_221_transpose_x_0 = const()[name = tensor("x_221_transpose_x_0"), val = tensor(false)]; tensor x_221_transpose_y_0 = const()[name = tensor("x_221_transpose_y_0"), val = tensor(false)]; tensor value_19_cast_fp16 = transpose(perm = value_19_perm_0, x = v_17_cast_fp16)[name = tensor("transpose_166")]; tensor x_221_cast_fp16 = matmul(transpose_x = x_221_transpose_x_0, transpose_y = x_221_transpose_y_0, x = input_457_cast_fp16, y = value_19_cast_fp16)[name = tensor("x_221_cast_fp16")]; tensor var_2048_perm_0 = const()[name = tensor("op_2048_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2049 = const()[name = tensor("op_2049"), val = tensor([1, -1, 512])]; tensor var_2048_cast_fp16 = transpose(perm = var_2048_perm_0, x = x_221_cast_fp16)[name = tensor("transpose_162")]; tensor input_459_cast_fp16 = reshape(shape = var_2049, x = var_2048_cast_fp16)[name = tensor("input_459_cast_fp16")]; tensor encoder_layers_8_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_8_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(108523456)))]; tensor linear_79_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_8_self_attn_linear_out_weight_to_fp16, x = input_459_cast_fp16)[name = tensor("linear_79_cast_fp16")]; tensor input_463_cast_fp16 = add(x = input_453_cast_fp16, y = linear_79_cast_fp16)[name = tensor("input_463_cast_fp16")]; tensor x_225_axes_0 = const()[name = tensor("x_225_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_8_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(109047808)))]; tensor encoder_layers_8_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_8_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(109048896)))]; tensor x_225_cast_fp16 = layer_norm(axes = x_225_axes_0, beta = encoder_layers_8_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_8_norm_conv_weight_to_fp16, x = input_463_cast_fp16)[name = tensor("x_225_cast_fp16")]; tensor input_465_perm_0 = const()[name = tensor("input_465_perm_0"), val = tensor([0, 2, 1])]; tensor input_467_pad_type_0 = const()[name = tensor("input_467_pad_type_0"), val = tensor("valid")]; tensor input_467_strides_0 = const()[name = tensor("input_467_strides_0"), val = tensor([1])]; tensor input_467_pad_0 = const()[name = tensor("input_467_pad_0"), val = tensor([0, 0])]; tensor input_467_dilations_0 = const()[name = tensor("input_467_dilations_0"), val = tensor([1])]; tensor input_467_groups_0 = const()[name = tensor("input_467_groups_0"), val = tensor(1)]; tensor encoder_layers_8_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_8_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(109049984)))]; tensor input_465_cast_fp16 = transpose(perm = input_465_perm_0, x = x_225_cast_fp16)[name = tensor("transpose_161")]; tensor input_467_cast_fp16 = conv(dilations = input_467_dilations_0, groups = input_467_groups_0, pad = input_467_pad_0, pad_type = input_467_pad_type_0, strides = input_467_strides_0, weight = encoder_layers_8_conv_pointwise_conv1_weight_to_fp16, x = input_465_cast_fp16)[name = tensor("input_467_cast_fp16")]; tensor x_227_split_num_splits_0 = const()[name = tensor("x_227_split_num_splits_0"), val = tensor(2)]; tensor x_227_split_axis_0 = const()[name = tensor("x_227_split_axis_0"), val = tensor(1)]; tensor x_227_split_cast_fp16_0, tensor x_227_split_cast_fp16_1 = split(axis = x_227_split_axis_0, num_splits = x_227_split_num_splits_0, x = input_467_cast_fp16)[name = tensor("x_227_split_cast_fp16")]; tensor x_227_split_1_sigmoid_cast_fp16 = sigmoid(x = x_227_split_cast_fp16_1)[name = tensor("x_227_split_1_sigmoid_cast_fp16")]; tensor x_227_cast_fp16 = mul(x = x_227_split_cast_fp16_0, y = x_227_split_1_sigmoid_cast_fp16)[name = tensor("x_227_cast_fp16")]; tensor input_469_cast_fp16 = select(a = var_40_to_fp16, b = x_227_cast_fp16, cond = var_418)[name = tensor("input_469_cast_fp16")]; tensor new_x_35_interleave_0 = const()[name = tensor("new_x_35_interleave_0"), val = tensor(false)]; tensor new_x_35_cast_fp16 = concat(axis = var_62, interleave = new_x_35_interleave_0, values = (cache_35_cast_fp16, input_469_cast_fp16))[name = tensor("new_x_35_cast_fp16")]; tensor next_cache_17_begin_0 = const()[name = tensor("next_cache_17_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_17_end_0 = const()[name = tensor("next_cache_17_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_17_end_mask_0 = const()[name = tensor("next_cache_17_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_17_cast_fp16 = slice_by_index(begin = next_cache_17_begin_0, end = next_cache_17_end_0, end_mask = next_cache_17_end_mask_0, x = new_x_35_cast_fp16)[name = tensor("next_cache_17_cast_fp16")]; tensor var_2090_begin_0 = const()[name = tensor("op_2090_begin_0"), val = tensor([0, 0, 1])]; tensor var_2090_end_0 = const()[name = tensor("op_2090_end_0"), val = tensor([1, 512, 9])]; tensor var_2090_end_mask_0 = const()[name = tensor("op_2090_end_mask_0"), val = tensor([true, true, true])]; tensor var_2090_cast_fp16 = slice_by_index(begin = var_2090_begin_0, end = var_2090_end_0, end_mask = var_2090_end_mask_0, x = next_cache_17_cast_fp16)[name = tensor("op_2090_cast_fp16")]; tensor x_229_pad_type_0 = const()[name = tensor("x_229_pad_type_0"), val = tensor("valid")]; tensor x_229_groups_0 = const()[name = tensor("x_229_groups_0"), val = tensor(512)]; tensor x_229_strides_0 = const()[name = tensor("x_229_strides_0"), val = tensor([1])]; tensor x_229_pad_0 = const()[name = tensor("x_229_pad_0"), val = tensor([0, 0])]; tensor x_229_dilations_0 = const()[name = tensor("x_229_dilations_0"), val = tensor([1])]; tensor encoder_layers_8_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_8_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110098624)))]; tensor x_229_cast_fp16 = conv(dilations = x_229_dilations_0, groups = x_229_groups_0, pad = x_229_pad_0, pad_type = x_229_pad_type_0, strides = x_229_strides_0, weight = encoder_layers_8_conv_depthwise_conv_weight_to_fp16, x = new_x_35_cast_fp16)[name = tensor("x_229_cast_fp16")]; tensor input_471_perm_0 = const()[name = tensor("input_471_perm_0"), val = tensor([0, 2, 1])]; tensor x_231_axes_0 = const()[name = tensor("x_231_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_8_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110107904)))]; tensor encoder_layers_8_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_8_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110108992)))]; tensor input_471_cast_fp16 = transpose(perm = input_471_perm_0, x = x_229_cast_fp16)[name = tensor("transpose_160")]; tensor x_231_cast_fp16 = layer_norm(axes = x_231_axes_0, beta = encoder_layers_8_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_8_conv_batch_norm_weight_to_fp16, x = input_471_cast_fp16)[name = tensor("x_231_cast_fp16")]; tensor input_473_perm_0 = const()[name = tensor("input_473_perm_0"), val = tensor([0, 2, 1])]; tensor input_473_cast_fp16 = transpose(perm = input_473_perm_0, x = x_231_cast_fp16)[name = tensor("transpose_159")]; tensor input_475_cast_fp16 = silu(x = input_473_cast_fp16)[name = tensor("input_475_cast_fp16")]; tensor x_233_pad_type_0 = const()[name = tensor("x_233_pad_type_0"), val = tensor("valid")]; tensor x_233_strides_0 = const()[name = tensor("x_233_strides_0"), val = tensor([1])]; tensor x_233_pad_0 = const()[name = tensor("x_233_pad_0"), val = tensor([0, 0])]; tensor x_233_dilations_0 = const()[name = tensor("x_233_dilations_0"), val = tensor([1])]; tensor x_233_groups_0 = const()[name = tensor("x_233_groups_0"), val = tensor(1)]; tensor encoder_layers_8_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_8_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110110080)))]; tensor x_233_cast_fp16 = conv(dilations = x_233_dilations_0, groups = x_233_groups_0, pad = x_233_pad_0, pad_type = x_233_pad_type_0, strides = x_233_strides_0, weight = encoder_layers_8_conv_pointwise_conv2_weight_to_fp16, x = input_475_cast_fp16)[name = tensor("x_233_cast_fp16")]; tensor input_477_perm_0 = const()[name = tensor("input_477_perm_0"), val = tensor([0, 2, 1])]; tensor input_477_cast_fp16 = transpose(perm = input_477_perm_0, x = x_233_cast_fp16)[name = tensor("transpose_158")]; tensor input_479_cast_fp16 = add(x = input_463_cast_fp16, y = input_477_cast_fp16)[name = tensor("input_479_cast_fp16")]; tensor input_481_axes_0 = const()[name = tensor("input_481_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_8_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110634432)))]; tensor encoder_layers_8_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_8_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110635520)))]; tensor input_481_cast_fp16 = layer_norm(axes = input_481_axes_0, beta = encoder_layers_8_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_8_norm_feed_forward2_weight_to_fp16, x = input_479_cast_fp16)[name = tensor("input_481_cast_fp16")]; tensor encoder_layers_8_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_8_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110636608)))]; tensor linear_80_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_8_feed_forward2_linear1_weight_to_fp16, x = input_481_cast_fp16)[name = tensor("linear_80_cast_fp16")]; tensor input_485_cast_fp16 = silu(x = linear_80_cast_fp16)[name = tensor("input_485_cast_fp16")]; tensor encoder_layers_8_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_8_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(112733824)))]; tensor linear_81_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_8_feed_forward2_linear2_weight_to_fp16, x = input_485_cast_fp16)[name = tensor("linear_81_cast_fp16")]; tensor var_2131_to_fp16 = const()[name = tensor("op_2131_to_fp16"), val = tensor(0x1p-1)]; tensor var_2132_cast_fp16 = mul(x = linear_81_cast_fp16, y = var_2131_to_fp16)[name = tensor("op_2132_cast_fp16")]; tensor input_491_cast_fp16 = add(x = input_479_cast_fp16, y = var_2132_cast_fp16)[name = tensor("input_491_cast_fp16")]; tensor input_493_axes_0 = const()[name = tensor("input_493_axes_0"), val = tensor([-1])]; tensor encoder_layers_8_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_8_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114831040)))]; tensor encoder_layers_8_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_8_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114832128)))]; tensor input_493_cast_fp16 = layer_norm(axes = input_493_axes_0, beta = encoder_layers_8_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_8_norm_out_weight_to_fp16, x = input_491_cast_fp16)[name = tensor("input_493_cast_fp16")]; tensor cache_37_begin_0 = const()[name = tensor("cache_37_begin_0"), val = tensor([9, 0, 0, 0])]; tensor cache_37_end_0 = const()[name = tensor("cache_37_end_0"), val = tensor([10, 1, 70, 512])]; tensor cache_37_end_mask_0 = const()[name = tensor("cache_37_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_37_squeeze_mask_0 = const()[name = tensor("cache_37_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_37_cast_fp16 = slice_by_index(begin = cache_37_begin_0, end = cache_37_end_0, end_mask = cache_37_end_mask_0, squeeze_mask = cache_37_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_37_cast_fp16")]; tensor cache_39_begin_0 = const()[name = tensor("cache_39_begin_0"), val = tensor([9, 0, 0, 0])]; tensor cache_39_end_0 = const()[name = tensor("cache_39_end_0"), val = tensor([10, 1, 512, 8])]; tensor cache_39_end_mask_0 = const()[name = tensor("cache_39_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_39_squeeze_mask_0 = const()[name = tensor("cache_39_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_39_cast_fp16 = slice_by_index(begin = cache_39_begin_0, end = cache_39_end_0, end_mask = cache_39_end_mask_0, squeeze_mask = cache_39_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_39_cast_fp16")]; tensor input_495_axes_0 = const()[name = tensor("input_495_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_9_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114833216)))]; tensor encoder_layers_9_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_9_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114834304)))]; tensor input_495_cast_fp16 = layer_norm(axes = input_495_axes_0, beta = encoder_layers_9_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_9_norm_feed_forward1_weight_to_fp16, x = input_493_cast_fp16)[name = tensor("input_495_cast_fp16")]; tensor encoder_layers_9_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_9_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114835392)))]; tensor linear_82_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_9_feed_forward1_linear1_weight_to_fp16, x = input_495_cast_fp16)[name = tensor("linear_82_cast_fp16")]; tensor input_499_cast_fp16 = silu(x = linear_82_cast_fp16)[name = tensor("input_499_cast_fp16")]; tensor encoder_layers_9_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_9_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(116932608)))]; tensor linear_83_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_9_feed_forward1_linear2_weight_to_fp16, x = input_499_cast_fp16)[name = tensor("linear_83_cast_fp16")]; tensor var_2166_to_fp16 = const()[name = tensor("op_2166_to_fp16"), val = tensor(0x1p-1)]; tensor var_2167_cast_fp16 = mul(x = linear_83_cast_fp16, y = var_2166_to_fp16)[name = tensor("op_2167_cast_fp16")]; tensor input_505_cast_fp16 = add(x = input_493_cast_fp16, y = var_2167_cast_fp16)[name = tensor("input_505_cast_fp16")]; tensor key_19_axes_0 = const()[name = tensor("key_19_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_9_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119029824)))]; tensor encoder_layers_9_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_9_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119030912)))]; tensor key_19_cast_fp16 = layer_norm(axes = key_19_axes_0, beta = encoder_layers_9_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_9_norm_self_att_weight_to_fp16, x = input_505_cast_fp16)[name = tensor("key_19_cast_fp16")]; tensor input_507_interleave_0 = const()[name = tensor("input_507_interleave_0"), val = tensor(false)]; tensor input_507_cast_fp16 = concat(axis = var_64, interleave = input_507_interleave_0, values = (cache_37_cast_fp16, key_19_cast_fp16))[name = tensor("input_507_cast_fp16")]; tensor var_2189_begin_0 = const()[name = tensor("op_2189_begin_0"), val = tensor([0, 1, 0])]; tensor var_2189_end_0 = const()[name = tensor("op_2189_end_0"), val = tensor([1, 70, 512])]; tensor var_2189_end_mask_0 = const()[name = tensor("op_2189_end_mask_0"), val = tensor([true, true, true])]; tensor var_2189_cast_fp16 = slice_by_index(begin = var_2189_begin_0, end = var_2189_end_0, end_mask = var_2189_end_mask_0, x = cache_37_cast_fp16)[name = tensor("op_2189_cast_fp16")]; tensor var_2192_begin_0 = const()[name = tensor("op_2192_begin_0"), val = tensor([0, 0, 0])]; tensor var_2192_end_0 = const()[name = tensor("op_2192_end_0"), val = tensor([1, 1, 512])]; tensor var_2192_end_mask_0 = const()[name = tensor("op_2192_end_mask_0"), val = tensor([true, false, true])]; tensor var_2192_cast_fp16 = slice_by_index(begin = var_2192_begin_0, end = var_2192_end_0, end_mask = var_2192_end_mask_0, x = key_19_cast_fp16)[name = tensor("op_2192_cast_fp16")]; tensor var_2195_interleave_0 = const()[name = tensor("op_2195_interleave_0"), val = tensor(false)]; tensor var_2195_cast_fp16 = concat(axis = var_64, interleave = var_2195_interleave_0, values = (var_2189_cast_fp16, var_2192_cast_fp16))[name = tensor("op_2195_cast_fp16")]; tensor encoder_layers_9_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119032000)))]; tensor linear_84_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_9_self_attn_linear_q_weight_to_fp16, x = key_19_cast_fp16)[name = tensor("linear_84_cast_fp16")]; tensor var_2199 = const()[name = tensor("op_2199"), val = tensor([1, -1, 8, 64])]; tensor q_55_cast_fp16 = reshape(shape = var_2199, x = linear_84_cast_fp16)[name = tensor("q_55_cast_fp16")]; tensor encoder_layers_9_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119556352)))]; tensor linear_85_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_9_self_attn_linear_k_weight_to_fp16, x = input_507_cast_fp16)[name = tensor("linear_85_cast_fp16")]; tensor var_2203 = const()[name = tensor("op_2203"), val = tensor([1, -1, 8, 64])]; tensor k_37_cast_fp16 = reshape(shape = var_2203, x = linear_85_cast_fp16)[name = tensor("k_37_cast_fp16")]; tensor encoder_layers_9_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(120080704)))]; tensor linear_86_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_9_self_attn_linear_v_weight_to_fp16, x = input_507_cast_fp16)[name = tensor("linear_86_cast_fp16")]; tensor var_2207 = const()[name = tensor("op_2207"), val = tensor([1, -1, 8, 64])]; tensor v_19_cast_fp16 = reshape(shape = var_2207, x = linear_86_cast_fp16)[name = tensor("v_19_cast_fp16")]; tensor value_21_perm_0 = const()[name = tensor("value_21_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_9_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(120605056)))]; tensor var_2219_cast_fp16 = add(x = q_55_cast_fp16, y = encoder_layers_9_self_attn_pos_bias_u_to_fp16)[name = tensor("op_2219_cast_fp16")]; tensor encoder_layers_9_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(120606144)))]; tensor var_2221_cast_fp16 = add(x = q_55_cast_fp16, y = encoder_layers_9_self_attn_pos_bias_v_to_fp16)[name = tensor("op_2221_cast_fp16")]; tensor q_with_bias_v_19_perm_0 = const()[name = tensor("q_with_bias_v_19_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_241_transpose_x_0 = const()[name = tensor("x_241_transpose_x_0"), val = tensor(false)]; tensor x_241_transpose_y_0 = const()[name = tensor("x_241_transpose_y_0"), val = tensor(false)]; tensor var_2223_to_fp16 = const()[name = tensor("op_2223_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(120607232)))]; tensor q_with_bias_v_19_cast_fp16 = transpose(perm = q_with_bias_v_19_perm_0, x = var_2221_cast_fp16)[name = tensor("transpose_156")]; tensor x_241_cast_fp16 = matmul(transpose_x = x_241_transpose_x_0, transpose_y = x_241_transpose_y_0, x = q_with_bias_v_19_cast_fp16, y = var_2223_to_fp16)[name = tensor("x_241_cast_fp16")]; tensor x_243_pad_0 = const()[name = tensor("x_243_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_243_mode_0 = const()[name = tensor("x_243_mode_0"), val = tensor("constant")]; tensor const_140_to_fp16 = const()[name = tensor("const_140_to_fp16"), val = tensor(0x0p+0)]; tensor x_243_cast_fp16 = pad(constant_val = const_140_to_fp16, mode = x_243_mode_0, pad = x_243_pad_0, x = x_241_cast_fp16)[name = tensor("x_243_cast_fp16")]; tensor var_2231 = const()[name = tensor("op_2231"), val = tensor([1, 8, -1, 3])]; tensor x_245_cast_fp16 = reshape(shape = var_2231, x = x_243_cast_fp16)[name = tensor("x_245_cast_fp16")]; tensor var_2235_begin_0 = const()[name = tensor("op_2235_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_2235_end_0 = const()[name = tensor("op_2235_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_2235_end_mask_0 = const()[name = tensor("op_2235_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_2235_cast_fp16 = slice_by_index(begin = var_2235_begin_0, end = var_2235_end_0, end_mask = var_2235_end_mask_0, x = x_245_cast_fp16)[name = tensor("op_2235_cast_fp16")]; tensor var_2236 = const()[name = tensor("op_2236"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_37_cast_fp16 = reshape(shape = var_2236, x = var_2235_cast_fp16)[name = tensor("matrix_bd_37_cast_fp16")]; tensor matrix_ac_19_transpose_x_0 = const()[name = tensor("matrix_ac_19_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_19_transpose_y_0 = const()[name = tensor("matrix_ac_19_transpose_y_0"), val = tensor(false)]; tensor transpose_69_perm_0 = const()[name = tensor("transpose_69_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_70_perm_0 = const()[name = tensor("transpose_70_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_70 = transpose(perm = transpose_70_perm_0, x = k_37_cast_fp16)[name = tensor("transpose_154")]; tensor transpose_69 = transpose(perm = transpose_69_perm_0, x = var_2219_cast_fp16)[name = tensor("transpose_155")]; tensor matrix_ac_19_cast_fp16 = matmul(transpose_x = matrix_ac_19_transpose_x_0, transpose_y = matrix_ac_19_transpose_y_0, x = transpose_69, y = transpose_70)[name = tensor("matrix_ac_19_cast_fp16")]; tensor matrix_bd_39_begin_0 = const()[name = tensor("matrix_bd_39_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_39_end_0 = const()[name = tensor("matrix_bd_39_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_39_end_mask_0 = const()[name = tensor("matrix_bd_39_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_39_cast_fp16 = slice_by_index(begin = matrix_bd_39_begin_0, end = matrix_bd_39_end_0, end_mask = matrix_bd_39_end_mask_0, x = matrix_bd_37_cast_fp16)[name = tensor("matrix_bd_39_cast_fp16")]; tensor var_2245_cast_fp16 = add(x = matrix_ac_19_cast_fp16, y = matrix_bd_39_cast_fp16)[name = tensor("op_2245_cast_fp16")]; tensor _inversed_scores_37_y_0_to_fp16 = const()[name = tensor("_inversed_scores_37_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_37_cast_fp16 = mul(x = var_2245_cast_fp16, y = _inversed_scores_37_y_0_to_fp16)[name = tensor("_inversed_scores_37_cast_fp16")]; tensor scores_39_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_37_cast_fp16, cond = mask_3)[name = tensor("scores_39_cast_fp16")]; tensor var_2251_cast_fp16 = softmax(axis = var_62, x = scores_39_cast_fp16)[name = tensor("op_2251_cast_fp16")]; tensor input_509_cast_fp16 = select(a = var_40_to_fp16, b = var_2251_cast_fp16, cond = mask_3)[name = tensor("input_509_cast_fp16")]; tensor x_247_transpose_x_0 = const()[name = tensor("x_247_transpose_x_0"), val = tensor(false)]; tensor x_247_transpose_y_0 = const()[name = tensor("x_247_transpose_y_0"), val = tensor(false)]; tensor value_21_cast_fp16 = transpose(perm = value_21_perm_0, x = v_19_cast_fp16)[name = tensor("transpose_157")]; tensor x_247_cast_fp16 = matmul(transpose_x = x_247_transpose_x_0, transpose_y = x_247_transpose_y_0, x = input_509_cast_fp16, y = value_21_cast_fp16)[name = tensor("x_247_cast_fp16")]; tensor var_2255_perm_0 = const()[name = tensor("op_2255_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2256 = const()[name = tensor("op_2256"), val = tensor([1, -1, 512])]; tensor var_2255_cast_fp16 = transpose(perm = var_2255_perm_0, x = x_247_cast_fp16)[name = tensor("transpose_153")]; tensor input_511_cast_fp16 = reshape(shape = var_2256, x = var_2255_cast_fp16)[name = tensor("input_511_cast_fp16")]; tensor encoder_layers_9_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_9_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(120755776)))]; tensor linear_88_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_9_self_attn_linear_out_weight_to_fp16, x = input_511_cast_fp16)[name = tensor("linear_88_cast_fp16")]; tensor input_515_cast_fp16 = add(x = input_505_cast_fp16, y = linear_88_cast_fp16)[name = tensor("input_515_cast_fp16")]; tensor x_251_axes_0 = const()[name = tensor("x_251_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_9_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121280128)))]; tensor encoder_layers_9_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_9_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121281216)))]; tensor x_251_cast_fp16 = layer_norm(axes = x_251_axes_0, beta = encoder_layers_9_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_9_norm_conv_weight_to_fp16, x = input_515_cast_fp16)[name = tensor("x_251_cast_fp16")]; tensor input_517_perm_0 = const()[name = tensor("input_517_perm_0"), val = tensor([0, 2, 1])]; tensor input_519_pad_type_0 = const()[name = tensor("input_519_pad_type_0"), val = tensor("valid")]; tensor input_519_strides_0 = const()[name = tensor("input_519_strides_0"), val = tensor([1])]; tensor input_519_pad_0 = const()[name = tensor("input_519_pad_0"), val = tensor([0, 0])]; tensor input_519_dilations_0 = const()[name = tensor("input_519_dilations_0"), val = tensor([1])]; tensor input_519_groups_0 = const()[name = tensor("input_519_groups_0"), val = tensor(1)]; tensor encoder_layers_9_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_9_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121282304)))]; tensor input_517_cast_fp16 = transpose(perm = input_517_perm_0, x = x_251_cast_fp16)[name = tensor("transpose_152")]; tensor input_519_cast_fp16 = conv(dilations = input_519_dilations_0, groups = input_519_groups_0, pad = input_519_pad_0, pad_type = input_519_pad_type_0, strides = input_519_strides_0, weight = encoder_layers_9_conv_pointwise_conv1_weight_to_fp16, x = input_517_cast_fp16)[name = tensor("input_519_cast_fp16")]; tensor x_253_split_num_splits_0 = const()[name = tensor("x_253_split_num_splits_0"), val = tensor(2)]; tensor x_253_split_axis_0 = const()[name = tensor("x_253_split_axis_0"), val = tensor(1)]; tensor x_253_split_cast_fp16_0, tensor x_253_split_cast_fp16_1 = split(axis = x_253_split_axis_0, num_splits = x_253_split_num_splits_0, x = input_519_cast_fp16)[name = tensor("x_253_split_cast_fp16")]; tensor x_253_split_1_sigmoid_cast_fp16 = sigmoid(x = x_253_split_cast_fp16_1)[name = tensor("x_253_split_1_sigmoid_cast_fp16")]; tensor x_253_cast_fp16 = mul(x = x_253_split_cast_fp16_0, y = x_253_split_1_sigmoid_cast_fp16)[name = tensor("x_253_cast_fp16")]; tensor input_521_cast_fp16 = select(a = var_40_to_fp16, b = x_253_cast_fp16, cond = var_418)[name = tensor("input_521_cast_fp16")]; tensor new_x_39_interleave_0 = const()[name = tensor("new_x_39_interleave_0"), val = tensor(false)]; tensor new_x_39_cast_fp16 = concat(axis = var_62, interleave = new_x_39_interleave_0, values = (cache_39_cast_fp16, input_521_cast_fp16))[name = tensor("new_x_39_cast_fp16")]; tensor next_cache_19_begin_0 = const()[name = tensor("next_cache_19_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_19_end_0 = const()[name = tensor("next_cache_19_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_19_end_mask_0 = const()[name = tensor("next_cache_19_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_19_cast_fp16 = slice_by_index(begin = next_cache_19_begin_0, end = next_cache_19_end_0, end_mask = next_cache_19_end_mask_0, x = new_x_39_cast_fp16)[name = tensor("next_cache_19_cast_fp16")]; tensor var_2297_begin_0 = const()[name = tensor("op_2297_begin_0"), val = tensor([0, 0, 1])]; tensor var_2297_end_0 = const()[name = tensor("op_2297_end_0"), val = tensor([1, 512, 9])]; tensor var_2297_end_mask_0 = const()[name = tensor("op_2297_end_mask_0"), val = tensor([true, true, true])]; tensor var_2297_cast_fp16 = slice_by_index(begin = var_2297_begin_0, end = var_2297_end_0, end_mask = var_2297_end_mask_0, x = next_cache_19_cast_fp16)[name = tensor("op_2297_cast_fp16")]; tensor x_255_pad_type_0 = const()[name = tensor("x_255_pad_type_0"), val = tensor("valid")]; tensor x_255_groups_0 = const()[name = tensor("x_255_groups_0"), val = tensor(512)]; tensor x_255_strides_0 = const()[name = tensor("x_255_strides_0"), val = tensor([1])]; tensor x_255_pad_0 = const()[name = tensor("x_255_pad_0"), val = tensor([0, 0])]; tensor x_255_dilations_0 = const()[name = tensor("x_255_dilations_0"), val = tensor([1])]; tensor encoder_layers_9_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_9_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122330944)))]; tensor x_255_cast_fp16 = conv(dilations = x_255_dilations_0, groups = x_255_groups_0, pad = x_255_pad_0, pad_type = x_255_pad_type_0, strides = x_255_strides_0, weight = encoder_layers_9_conv_depthwise_conv_weight_to_fp16, x = new_x_39_cast_fp16)[name = tensor("x_255_cast_fp16")]; tensor input_523_perm_0 = const()[name = tensor("input_523_perm_0"), val = tensor([0, 2, 1])]; tensor x_257_axes_0 = const()[name = tensor("x_257_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_9_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122340224)))]; tensor encoder_layers_9_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_9_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122341312)))]; tensor input_523_cast_fp16 = transpose(perm = input_523_perm_0, x = x_255_cast_fp16)[name = tensor("transpose_151")]; tensor x_257_cast_fp16 = layer_norm(axes = x_257_axes_0, beta = encoder_layers_9_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_9_conv_batch_norm_weight_to_fp16, x = input_523_cast_fp16)[name = tensor("x_257_cast_fp16")]; tensor input_525_perm_0 = const()[name = tensor("input_525_perm_0"), val = tensor([0, 2, 1])]; tensor input_525_cast_fp16 = transpose(perm = input_525_perm_0, x = x_257_cast_fp16)[name = tensor("transpose_150")]; tensor input_527_cast_fp16 = silu(x = input_525_cast_fp16)[name = tensor("input_527_cast_fp16")]; tensor x_259_pad_type_0 = const()[name = tensor("x_259_pad_type_0"), val = tensor("valid")]; tensor x_259_strides_0 = const()[name = tensor("x_259_strides_0"), val = tensor([1])]; tensor x_259_pad_0 = const()[name = tensor("x_259_pad_0"), val = tensor([0, 0])]; tensor x_259_dilations_0 = const()[name = tensor("x_259_dilations_0"), val = tensor([1])]; tensor x_259_groups_0 = const()[name = tensor("x_259_groups_0"), val = tensor(1)]; tensor encoder_layers_9_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_9_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122342400)))]; tensor x_259_cast_fp16 = conv(dilations = x_259_dilations_0, groups = x_259_groups_0, pad = x_259_pad_0, pad_type = x_259_pad_type_0, strides = x_259_strides_0, weight = encoder_layers_9_conv_pointwise_conv2_weight_to_fp16, x = input_527_cast_fp16)[name = tensor("x_259_cast_fp16")]; tensor input_529_perm_0 = const()[name = tensor("input_529_perm_0"), val = tensor([0, 2, 1])]; tensor input_529_cast_fp16 = transpose(perm = input_529_perm_0, x = x_259_cast_fp16)[name = tensor("transpose_149")]; tensor input_531_cast_fp16 = add(x = input_515_cast_fp16, y = input_529_cast_fp16)[name = tensor("input_531_cast_fp16")]; tensor input_533_axes_0 = const()[name = tensor("input_533_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_9_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122866752)))]; tensor encoder_layers_9_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_9_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122867840)))]; tensor input_533_cast_fp16 = layer_norm(axes = input_533_axes_0, beta = encoder_layers_9_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_9_norm_feed_forward2_weight_to_fp16, x = input_531_cast_fp16)[name = tensor("input_533_cast_fp16")]; tensor encoder_layers_9_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_9_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(122868928)))]; tensor linear_89_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_9_feed_forward2_linear1_weight_to_fp16, x = input_533_cast_fp16)[name = tensor("linear_89_cast_fp16")]; tensor input_537_cast_fp16 = silu(x = linear_89_cast_fp16)[name = tensor("input_537_cast_fp16")]; tensor encoder_layers_9_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_9_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(124966144)))]; tensor linear_90_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_9_feed_forward2_linear2_weight_to_fp16, x = input_537_cast_fp16)[name = tensor("linear_90_cast_fp16")]; tensor var_2338_to_fp16 = const()[name = tensor("op_2338_to_fp16"), val = tensor(0x1p-1)]; tensor var_2339_cast_fp16 = mul(x = linear_90_cast_fp16, y = var_2338_to_fp16)[name = tensor("op_2339_cast_fp16")]; tensor input_543_cast_fp16 = add(x = input_531_cast_fp16, y = var_2339_cast_fp16)[name = tensor("input_543_cast_fp16")]; tensor input_545_axes_0 = const()[name = tensor("input_545_axes_0"), val = tensor([-1])]; tensor encoder_layers_9_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_9_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127063360)))]; tensor encoder_layers_9_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_9_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127064448)))]; tensor input_545_cast_fp16 = layer_norm(axes = input_545_axes_0, beta = encoder_layers_9_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_9_norm_out_weight_to_fp16, x = input_543_cast_fp16)[name = tensor("input_545_cast_fp16")]; tensor cache_41_begin_0 = const()[name = tensor("cache_41_begin_0"), val = tensor([10, 0, 0, 0])]; tensor cache_41_end_0 = const()[name = tensor("cache_41_end_0"), val = tensor([11, 1, 70, 512])]; tensor cache_41_end_mask_0 = const()[name = tensor("cache_41_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_41_squeeze_mask_0 = const()[name = tensor("cache_41_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_41_cast_fp16 = slice_by_index(begin = cache_41_begin_0, end = cache_41_end_0, end_mask = cache_41_end_mask_0, squeeze_mask = cache_41_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_41_cast_fp16")]; tensor cache_43_begin_0 = const()[name = tensor("cache_43_begin_0"), val = tensor([10, 0, 0, 0])]; tensor cache_43_end_0 = const()[name = tensor("cache_43_end_0"), val = tensor([11, 1, 512, 8])]; tensor cache_43_end_mask_0 = const()[name = tensor("cache_43_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_43_squeeze_mask_0 = const()[name = tensor("cache_43_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_43_cast_fp16 = slice_by_index(begin = cache_43_begin_0, end = cache_43_end_0, end_mask = cache_43_end_mask_0, squeeze_mask = cache_43_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_43_cast_fp16")]; tensor input_547_axes_0 = const()[name = tensor("input_547_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_10_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127065536)))]; tensor encoder_layers_10_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_10_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127066624)))]; tensor input_547_cast_fp16 = layer_norm(axes = input_547_axes_0, beta = encoder_layers_10_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_10_norm_feed_forward1_weight_to_fp16, x = input_545_cast_fp16)[name = tensor("input_547_cast_fp16")]; tensor encoder_layers_10_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_10_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127067712)))]; tensor linear_91_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_10_feed_forward1_linear1_weight_to_fp16, x = input_547_cast_fp16)[name = tensor("linear_91_cast_fp16")]; tensor input_551_cast_fp16 = silu(x = linear_91_cast_fp16)[name = tensor("input_551_cast_fp16")]; tensor encoder_layers_10_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_10_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(129164928)))]; tensor linear_92_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_10_feed_forward1_linear2_weight_to_fp16, x = input_551_cast_fp16)[name = tensor("linear_92_cast_fp16")]; tensor var_2373_to_fp16 = const()[name = tensor("op_2373_to_fp16"), val = tensor(0x1p-1)]; tensor var_2374_cast_fp16 = mul(x = linear_92_cast_fp16, y = var_2373_to_fp16)[name = tensor("op_2374_cast_fp16")]; tensor input_557_cast_fp16 = add(x = input_545_cast_fp16, y = var_2374_cast_fp16)[name = tensor("input_557_cast_fp16")]; tensor key_21_axes_0 = const()[name = tensor("key_21_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_10_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(131262144)))]; tensor encoder_layers_10_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_10_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(131263232)))]; tensor key_21_cast_fp16 = layer_norm(axes = key_21_axes_0, beta = encoder_layers_10_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_10_norm_self_att_weight_to_fp16, x = input_557_cast_fp16)[name = tensor("key_21_cast_fp16")]; tensor input_559_interleave_0 = const()[name = tensor("input_559_interleave_0"), val = tensor(false)]; tensor input_559_cast_fp16 = concat(axis = var_64, interleave = input_559_interleave_0, values = (cache_41_cast_fp16, key_21_cast_fp16))[name = tensor("input_559_cast_fp16")]; tensor var_2396_begin_0 = const()[name = tensor("op_2396_begin_0"), val = tensor([0, 1, 0])]; tensor var_2396_end_0 = const()[name = tensor("op_2396_end_0"), val = tensor([1, 70, 512])]; tensor var_2396_end_mask_0 = const()[name = tensor("op_2396_end_mask_0"), val = tensor([true, true, true])]; tensor var_2396_cast_fp16 = slice_by_index(begin = var_2396_begin_0, end = var_2396_end_0, end_mask = var_2396_end_mask_0, x = cache_41_cast_fp16)[name = tensor("op_2396_cast_fp16")]; tensor var_2399_begin_0 = const()[name = tensor("op_2399_begin_0"), val = tensor([0, 0, 0])]; tensor var_2399_end_0 = const()[name = tensor("op_2399_end_0"), val = tensor([1, 1, 512])]; tensor var_2399_end_mask_0 = const()[name = tensor("op_2399_end_mask_0"), val = tensor([true, false, true])]; tensor var_2399_cast_fp16 = slice_by_index(begin = var_2399_begin_0, end = var_2399_end_0, end_mask = var_2399_end_mask_0, x = key_21_cast_fp16)[name = tensor("op_2399_cast_fp16")]; tensor var_2402_interleave_0 = const()[name = tensor("op_2402_interleave_0"), val = tensor(false)]; tensor var_2402_cast_fp16 = concat(axis = var_64, interleave = var_2402_interleave_0, values = (var_2396_cast_fp16, var_2399_cast_fp16))[name = tensor("op_2402_cast_fp16")]; tensor encoder_layers_10_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(131264320)))]; tensor linear_93_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_10_self_attn_linear_q_weight_to_fp16, x = key_21_cast_fp16)[name = tensor("linear_93_cast_fp16")]; tensor var_2406 = const()[name = tensor("op_2406"), val = tensor([1, -1, 8, 64])]; tensor q_61_cast_fp16 = reshape(shape = var_2406, x = linear_93_cast_fp16)[name = tensor("q_61_cast_fp16")]; tensor encoder_layers_10_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(131788672)))]; tensor linear_94_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_10_self_attn_linear_k_weight_to_fp16, x = input_559_cast_fp16)[name = tensor("linear_94_cast_fp16")]; tensor var_2410 = const()[name = tensor("op_2410"), val = tensor([1, -1, 8, 64])]; tensor k_41_cast_fp16 = reshape(shape = var_2410, x = linear_94_cast_fp16)[name = tensor("k_41_cast_fp16")]; tensor encoder_layers_10_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132313024)))]; tensor linear_95_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_10_self_attn_linear_v_weight_to_fp16, x = input_559_cast_fp16)[name = tensor("linear_95_cast_fp16")]; tensor var_2414 = const()[name = tensor("op_2414"), val = tensor([1, -1, 8, 64])]; tensor v_21_cast_fp16 = reshape(shape = var_2414, x = linear_95_cast_fp16)[name = tensor("v_21_cast_fp16")]; tensor value_23_perm_0 = const()[name = tensor("value_23_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_10_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132837376)))]; tensor var_2426_cast_fp16 = add(x = q_61_cast_fp16, y = encoder_layers_10_self_attn_pos_bias_u_to_fp16)[name = tensor("op_2426_cast_fp16")]; tensor encoder_layers_10_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132838464)))]; tensor var_2428_cast_fp16 = add(x = q_61_cast_fp16, y = encoder_layers_10_self_attn_pos_bias_v_to_fp16)[name = tensor("op_2428_cast_fp16")]; tensor q_with_bias_v_21_perm_0 = const()[name = tensor("q_with_bias_v_21_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_267_transpose_x_0 = const()[name = tensor("x_267_transpose_x_0"), val = tensor(false)]; tensor x_267_transpose_y_0 = const()[name = tensor("x_267_transpose_y_0"), val = tensor(false)]; tensor var_2430_to_fp16 = const()[name = tensor("op_2430_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132839552)))]; tensor q_with_bias_v_21_cast_fp16 = transpose(perm = q_with_bias_v_21_perm_0, x = var_2428_cast_fp16)[name = tensor("transpose_147")]; tensor x_267_cast_fp16 = matmul(transpose_x = x_267_transpose_x_0, transpose_y = x_267_transpose_y_0, x = q_with_bias_v_21_cast_fp16, y = var_2430_to_fp16)[name = tensor("x_267_cast_fp16")]; tensor x_269_pad_0 = const()[name = tensor("x_269_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_269_mode_0 = const()[name = tensor("x_269_mode_0"), val = tensor("constant")]; tensor const_153_to_fp16 = const()[name = tensor("const_153_to_fp16"), val = tensor(0x0p+0)]; tensor x_269_cast_fp16 = pad(constant_val = const_153_to_fp16, mode = x_269_mode_0, pad = x_269_pad_0, x = x_267_cast_fp16)[name = tensor("x_269_cast_fp16")]; tensor var_2438 = const()[name = tensor("op_2438"), val = tensor([1, 8, -1, 3])]; tensor x_271_cast_fp16 = reshape(shape = var_2438, x = x_269_cast_fp16)[name = tensor("x_271_cast_fp16")]; tensor var_2442_begin_0 = const()[name = tensor("op_2442_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_2442_end_0 = const()[name = tensor("op_2442_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_2442_end_mask_0 = const()[name = tensor("op_2442_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_2442_cast_fp16 = slice_by_index(begin = var_2442_begin_0, end = var_2442_end_0, end_mask = var_2442_end_mask_0, x = x_271_cast_fp16)[name = tensor("op_2442_cast_fp16")]; tensor var_2443 = const()[name = tensor("op_2443"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_41_cast_fp16 = reshape(shape = var_2443, x = var_2442_cast_fp16)[name = tensor("matrix_bd_41_cast_fp16")]; tensor matrix_ac_21_transpose_x_0 = const()[name = tensor("matrix_ac_21_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_21_transpose_y_0 = const()[name = tensor("matrix_ac_21_transpose_y_0"), val = tensor(false)]; tensor transpose_71_perm_0 = const()[name = tensor("transpose_71_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_72_perm_0 = const()[name = tensor("transpose_72_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_72 = transpose(perm = transpose_72_perm_0, x = k_41_cast_fp16)[name = tensor("transpose_145")]; tensor transpose_71 = transpose(perm = transpose_71_perm_0, x = var_2426_cast_fp16)[name = tensor("transpose_146")]; tensor matrix_ac_21_cast_fp16 = matmul(transpose_x = matrix_ac_21_transpose_x_0, transpose_y = matrix_ac_21_transpose_y_0, x = transpose_71, y = transpose_72)[name = tensor("matrix_ac_21_cast_fp16")]; tensor matrix_bd_43_begin_0 = const()[name = tensor("matrix_bd_43_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_43_end_0 = const()[name = tensor("matrix_bd_43_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_43_end_mask_0 = const()[name = tensor("matrix_bd_43_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_43_cast_fp16 = slice_by_index(begin = matrix_bd_43_begin_0, end = matrix_bd_43_end_0, end_mask = matrix_bd_43_end_mask_0, x = matrix_bd_41_cast_fp16)[name = tensor("matrix_bd_43_cast_fp16")]; tensor var_2452_cast_fp16 = add(x = matrix_ac_21_cast_fp16, y = matrix_bd_43_cast_fp16)[name = tensor("op_2452_cast_fp16")]; tensor _inversed_scores_41_y_0_to_fp16 = const()[name = tensor("_inversed_scores_41_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_41_cast_fp16 = mul(x = var_2452_cast_fp16, y = _inversed_scores_41_y_0_to_fp16)[name = tensor("_inversed_scores_41_cast_fp16")]; tensor scores_43_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_41_cast_fp16, cond = mask_3)[name = tensor("scores_43_cast_fp16")]; tensor var_2458_cast_fp16 = softmax(axis = var_62, x = scores_43_cast_fp16)[name = tensor("op_2458_cast_fp16")]; tensor input_561_cast_fp16 = select(a = var_40_to_fp16, b = var_2458_cast_fp16, cond = mask_3)[name = tensor("input_561_cast_fp16")]; tensor x_273_transpose_x_0 = const()[name = tensor("x_273_transpose_x_0"), val = tensor(false)]; tensor x_273_transpose_y_0 = const()[name = tensor("x_273_transpose_y_0"), val = tensor(false)]; tensor value_23_cast_fp16 = transpose(perm = value_23_perm_0, x = v_21_cast_fp16)[name = tensor("transpose_148")]; tensor x_273_cast_fp16 = matmul(transpose_x = x_273_transpose_x_0, transpose_y = x_273_transpose_y_0, x = input_561_cast_fp16, y = value_23_cast_fp16)[name = tensor("x_273_cast_fp16")]; tensor var_2462_perm_0 = const()[name = tensor("op_2462_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2463 = const()[name = tensor("op_2463"), val = tensor([1, -1, 512])]; tensor var_2462_cast_fp16 = transpose(perm = var_2462_perm_0, x = x_273_cast_fp16)[name = tensor("transpose_144")]; tensor input_563_cast_fp16 = reshape(shape = var_2463, x = var_2462_cast_fp16)[name = tensor("input_563_cast_fp16")]; tensor encoder_layers_10_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_10_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132988096)))]; tensor linear_97_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_10_self_attn_linear_out_weight_to_fp16, x = input_563_cast_fp16)[name = tensor("linear_97_cast_fp16")]; tensor input_567_cast_fp16 = add(x = input_557_cast_fp16, y = linear_97_cast_fp16)[name = tensor("input_567_cast_fp16")]; tensor x_277_axes_0 = const()[name = tensor("x_277_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_10_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(133512448)))]; tensor encoder_layers_10_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_10_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(133513536)))]; tensor x_277_cast_fp16 = layer_norm(axes = x_277_axes_0, beta = encoder_layers_10_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_10_norm_conv_weight_to_fp16, x = input_567_cast_fp16)[name = tensor("x_277_cast_fp16")]; tensor input_569_perm_0 = const()[name = tensor("input_569_perm_0"), val = tensor([0, 2, 1])]; tensor input_571_pad_type_0 = const()[name = tensor("input_571_pad_type_0"), val = tensor("valid")]; tensor input_571_strides_0 = const()[name = tensor("input_571_strides_0"), val = tensor([1])]; tensor input_571_pad_0 = const()[name = tensor("input_571_pad_0"), val = tensor([0, 0])]; tensor input_571_dilations_0 = const()[name = tensor("input_571_dilations_0"), val = tensor([1])]; tensor input_571_groups_0 = const()[name = tensor("input_571_groups_0"), val = tensor(1)]; tensor encoder_layers_10_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_10_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(133514624)))]; tensor input_569_cast_fp16 = transpose(perm = input_569_perm_0, x = x_277_cast_fp16)[name = tensor("transpose_143")]; tensor input_571_cast_fp16 = conv(dilations = input_571_dilations_0, groups = input_571_groups_0, pad = input_571_pad_0, pad_type = input_571_pad_type_0, strides = input_571_strides_0, weight = encoder_layers_10_conv_pointwise_conv1_weight_to_fp16, x = input_569_cast_fp16)[name = tensor("input_571_cast_fp16")]; tensor x_279_split_num_splits_0 = const()[name = tensor("x_279_split_num_splits_0"), val = tensor(2)]; tensor x_279_split_axis_0 = const()[name = tensor("x_279_split_axis_0"), val = tensor(1)]; tensor x_279_split_cast_fp16_0, tensor x_279_split_cast_fp16_1 = split(axis = x_279_split_axis_0, num_splits = x_279_split_num_splits_0, x = input_571_cast_fp16)[name = tensor("x_279_split_cast_fp16")]; tensor x_279_split_1_sigmoid_cast_fp16 = sigmoid(x = x_279_split_cast_fp16_1)[name = tensor("x_279_split_1_sigmoid_cast_fp16")]; tensor x_279_cast_fp16 = mul(x = x_279_split_cast_fp16_0, y = x_279_split_1_sigmoid_cast_fp16)[name = tensor("x_279_cast_fp16")]; tensor input_573_cast_fp16 = select(a = var_40_to_fp16, b = x_279_cast_fp16, cond = var_418)[name = tensor("input_573_cast_fp16")]; tensor new_x_43_interleave_0 = const()[name = tensor("new_x_43_interleave_0"), val = tensor(false)]; tensor new_x_43_cast_fp16 = concat(axis = var_62, interleave = new_x_43_interleave_0, values = (cache_43_cast_fp16, input_573_cast_fp16))[name = tensor("new_x_43_cast_fp16")]; tensor next_cache_21_begin_0 = const()[name = tensor("next_cache_21_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_21_end_0 = const()[name = tensor("next_cache_21_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_21_end_mask_0 = const()[name = tensor("next_cache_21_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_21_cast_fp16 = slice_by_index(begin = next_cache_21_begin_0, end = next_cache_21_end_0, end_mask = next_cache_21_end_mask_0, x = new_x_43_cast_fp16)[name = tensor("next_cache_21_cast_fp16")]; tensor var_2504_begin_0 = const()[name = tensor("op_2504_begin_0"), val = tensor([0, 0, 1])]; tensor var_2504_end_0 = const()[name = tensor("op_2504_end_0"), val = tensor([1, 512, 9])]; tensor var_2504_end_mask_0 = const()[name = tensor("op_2504_end_mask_0"), val = tensor([true, true, true])]; tensor var_2504_cast_fp16 = slice_by_index(begin = var_2504_begin_0, end = var_2504_end_0, end_mask = var_2504_end_mask_0, x = next_cache_21_cast_fp16)[name = tensor("op_2504_cast_fp16")]; tensor x_281_pad_type_0 = const()[name = tensor("x_281_pad_type_0"), val = tensor("valid")]; tensor x_281_groups_0 = const()[name = tensor("x_281_groups_0"), val = tensor(512)]; tensor x_281_strides_0 = const()[name = tensor("x_281_strides_0"), val = tensor([1])]; tensor x_281_pad_0 = const()[name = tensor("x_281_pad_0"), val = tensor([0, 0])]; tensor x_281_dilations_0 = const()[name = tensor("x_281_dilations_0"), val = tensor([1])]; tensor encoder_layers_10_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_10_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(134563264)))]; tensor x_281_cast_fp16 = conv(dilations = x_281_dilations_0, groups = x_281_groups_0, pad = x_281_pad_0, pad_type = x_281_pad_type_0, strides = x_281_strides_0, weight = encoder_layers_10_conv_depthwise_conv_weight_to_fp16, x = new_x_43_cast_fp16)[name = tensor("x_281_cast_fp16")]; tensor input_575_perm_0 = const()[name = tensor("input_575_perm_0"), val = tensor([0, 2, 1])]; tensor x_283_axes_0 = const()[name = tensor("x_283_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_10_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(134572544)))]; tensor encoder_layers_10_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_10_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(134573632)))]; tensor input_575_cast_fp16 = transpose(perm = input_575_perm_0, x = x_281_cast_fp16)[name = tensor("transpose_142")]; tensor x_283_cast_fp16 = layer_norm(axes = x_283_axes_0, beta = encoder_layers_10_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_10_conv_batch_norm_weight_to_fp16, x = input_575_cast_fp16)[name = tensor("x_283_cast_fp16")]; tensor input_577_perm_0 = const()[name = tensor("input_577_perm_0"), val = tensor([0, 2, 1])]; tensor input_577_cast_fp16 = transpose(perm = input_577_perm_0, x = x_283_cast_fp16)[name = tensor("transpose_141")]; tensor input_579_cast_fp16 = silu(x = input_577_cast_fp16)[name = tensor("input_579_cast_fp16")]; tensor x_285_pad_type_0 = const()[name = tensor("x_285_pad_type_0"), val = tensor("valid")]; tensor x_285_strides_0 = const()[name = tensor("x_285_strides_0"), val = tensor([1])]; tensor x_285_pad_0 = const()[name = tensor("x_285_pad_0"), val = tensor([0, 0])]; tensor x_285_dilations_0 = const()[name = tensor("x_285_dilations_0"), val = tensor([1])]; tensor x_285_groups_0 = const()[name = tensor("x_285_groups_0"), val = tensor(1)]; tensor encoder_layers_10_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_10_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(134574720)))]; tensor x_285_cast_fp16 = conv(dilations = x_285_dilations_0, groups = x_285_groups_0, pad = x_285_pad_0, pad_type = x_285_pad_type_0, strides = x_285_strides_0, weight = encoder_layers_10_conv_pointwise_conv2_weight_to_fp16, x = input_579_cast_fp16)[name = tensor("x_285_cast_fp16")]; tensor input_581_perm_0 = const()[name = tensor("input_581_perm_0"), val = tensor([0, 2, 1])]; tensor input_581_cast_fp16 = transpose(perm = input_581_perm_0, x = x_285_cast_fp16)[name = tensor("transpose_140")]; tensor input_583_cast_fp16 = add(x = input_567_cast_fp16, y = input_581_cast_fp16)[name = tensor("input_583_cast_fp16")]; tensor input_585_axes_0 = const()[name = tensor("input_585_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_10_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135099072)))]; tensor encoder_layers_10_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_10_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135100160)))]; tensor input_585_cast_fp16 = layer_norm(axes = input_585_axes_0, beta = encoder_layers_10_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_10_norm_feed_forward2_weight_to_fp16, x = input_583_cast_fp16)[name = tensor("input_585_cast_fp16")]; tensor encoder_layers_10_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_10_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135101248)))]; tensor linear_98_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_10_feed_forward2_linear1_weight_to_fp16, x = input_585_cast_fp16)[name = tensor("linear_98_cast_fp16")]; tensor input_589_cast_fp16 = silu(x = linear_98_cast_fp16)[name = tensor("input_589_cast_fp16")]; tensor encoder_layers_10_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_10_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(137198464)))]; tensor linear_99_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_10_feed_forward2_linear2_weight_to_fp16, x = input_589_cast_fp16)[name = tensor("linear_99_cast_fp16")]; tensor var_2545_to_fp16 = const()[name = tensor("op_2545_to_fp16"), val = tensor(0x1p-1)]; tensor var_2546_cast_fp16 = mul(x = linear_99_cast_fp16, y = var_2545_to_fp16)[name = tensor("op_2546_cast_fp16")]; tensor input_595_cast_fp16 = add(x = input_583_cast_fp16, y = var_2546_cast_fp16)[name = tensor("input_595_cast_fp16")]; tensor input_597_axes_0 = const()[name = tensor("input_597_axes_0"), val = tensor([-1])]; tensor encoder_layers_10_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_10_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139295680)))]; tensor encoder_layers_10_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_10_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139296768)))]; tensor input_597_cast_fp16 = layer_norm(axes = input_597_axes_0, beta = encoder_layers_10_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_10_norm_out_weight_to_fp16, x = input_595_cast_fp16)[name = tensor("input_597_cast_fp16")]; tensor cache_45_begin_0 = const()[name = tensor("cache_45_begin_0"), val = tensor([11, 0, 0, 0])]; tensor cache_45_end_0 = const()[name = tensor("cache_45_end_0"), val = tensor([12, 1, 70, 512])]; tensor cache_45_end_mask_0 = const()[name = tensor("cache_45_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_45_squeeze_mask_0 = const()[name = tensor("cache_45_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_45_cast_fp16 = slice_by_index(begin = cache_45_begin_0, end = cache_45_end_0, end_mask = cache_45_end_mask_0, squeeze_mask = cache_45_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_45_cast_fp16")]; tensor cache_47_begin_0 = const()[name = tensor("cache_47_begin_0"), val = tensor([11, 0, 0, 0])]; tensor cache_47_end_0 = const()[name = tensor("cache_47_end_0"), val = tensor([12, 1, 512, 8])]; tensor cache_47_end_mask_0 = const()[name = tensor("cache_47_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_47_squeeze_mask_0 = const()[name = tensor("cache_47_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_47_cast_fp16 = slice_by_index(begin = cache_47_begin_0, end = cache_47_end_0, end_mask = cache_47_end_mask_0, squeeze_mask = cache_47_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_47_cast_fp16")]; tensor input_599_axes_0 = const()[name = tensor("input_599_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_11_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139297856)))]; tensor encoder_layers_11_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_11_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139298944)))]; tensor input_599_cast_fp16 = layer_norm(axes = input_599_axes_0, beta = encoder_layers_11_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_11_norm_feed_forward1_weight_to_fp16, x = input_597_cast_fp16)[name = tensor("input_599_cast_fp16")]; tensor encoder_layers_11_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_11_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139300032)))]; tensor linear_100_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_11_feed_forward1_linear1_weight_to_fp16, x = input_599_cast_fp16)[name = tensor("linear_100_cast_fp16")]; tensor input_603_cast_fp16 = silu(x = linear_100_cast_fp16)[name = tensor("input_603_cast_fp16")]; tensor encoder_layers_11_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_11_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141397248)))]; tensor linear_101_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_11_feed_forward1_linear2_weight_to_fp16, x = input_603_cast_fp16)[name = tensor("linear_101_cast_fp16")]; tensor var_2580_to_fp16 = const()[name = tensor("op_2580_to_fp16"), val = tensor(0x1p-1)]; tensor var_2581_cast_fp16 = mul(x = linear_101_cast_fp16, y = var_2580_to_fp16)[name = tensor("op_2581_cast_fp16")]; tensor input_609_cast_fp16 = add(x = input_597_cast_fp16, y = var_2581_cast_fp16)[name = tensor("input_609_cast_fp16")]; tensor key_23_axes_0 = const()[name = tensor("key_23_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_11_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(143494464)))]; tensor encoder_layers_11_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_11_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(143495552)))]; tensor key_23_cast_fp16 = layer_norm(axes = key_23_axes_0, beta = encoder_layers_11_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_11_norm_self_att_weight_to_fp16, x = input_609_cast_fp16)[name = tensor("key_23_cast_fp16")]; tensor input_611_interleave_0 = const()[name = tensor("input_611_interleave_0"), val = tensor(false)]; tensor input_611_cast_fp16 = concat(axis = var_64, interleave = input_611_interleave_0, values = (cache_45_cast_fp16, key_23_cast_fp16))[name = tensor("input_611_cast_fp16")]; tensor var_2603_begin_0 = const()[name = tensor("op_2603_begin_0"), val = tensor([0, 1, 0])]; tensor var_2603_end_0 = const()[name = tensor("op_2603_end_0"), val = tensor([1, 70, 512])]; tensor var_2603_end_mask_0 = const()[name = tensor("op_2603_end_mask_0"), val = tensor([true, true, true])]; tensor var_2603_cast_fp16 = slice_by_index(begin = var_2603_begin_0, end = var_2603_end_0, end_mask = var_2603_end_mask_0, x = cache_45_cast_fp16)[name = tensor("op_2603_cast_fp16")]; tensor var_2606_begin_0 = const()[name = tensor("op_2606_begin_0"), val = tensor([0, 0, 0])]; tensor var_2606_end_0 = const()[name = tensor("op_2606_end_0"), val = tensor([1, 1, 512])]; tensor var_2606_end_mask_0 = const()[name = tensor("op_2606_end_mask_0"), val = tensor([true, false, true])]; tensor var_2606_cast_fp16 = slice_by_index(begin = var_2606_begin_0, end = var_2606_end_0, end_mask = var_2606_end_mask_0, x = key_23_cast_fp16)[name = tensor("op_2606_cast_fp16")]; tensor var_2609_interleave_0 = const()[name = tensor("op_2609_interleave_0"), val = tensor(false)]; tensor var_2609_cast_fp16 = concat(axis = var_64, interleave = var_2609_interleave_0, values = (var_2603_cast_fp16, var_2606_cast_fp16))[name = tensor("op_2609_cast_fp16")]; tensor encoder_layers_11_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(143496640)))]; tensor linear_102_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_11_self_attn_linear_q_weight_to_fp16, x = key_23_cast_fp16)[name = tensor("linear_102_cast_fp16")]; tensor var_2613 = const()[name = tensor("op_2613"), val = tensor([1, -1, 8, 64])]; tensor q_67_cast_fp16 = reshape(shape = var_2613, x = linear_102_cast_fp16)[name = tensor("q_67_cast_fp16")]; tensor encoder_layers_11_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144020992)))]; tensor linear_103_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_11_self_attn_linear_k_weight_to_fp16, x = input_611_cast_fp16)[name = tensor("linear_103_cast_fp16")]; tensor var_2617 = const()[name = tensor("op_2617"), val = tensor([1, -1, 8, 64])]; tensor k_45_cast_fp16 = reshape(shape = var_2617, x = linear_103_cast_fp16)[name = tensor("k_45_cast_fp16")]; tensor encoder_layers_11_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144545344)))]; tensor linear_104_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_11_self_attn_linear_v_weight_to_fp16, x = input_611_cast_fp16)[name = tensor("linear_104_cast_fp16")]; tensor var_2621 = const()[name = tensor("op_2621"), val = tensor([1, -1, 8, 64])]; tensor v_23_cast_fp16 = reshape(shape = var_2621, x = linear_104_cast_fp16)[name = tensor("v_23_cast_fp16")]; tensor value_25_perm_0 = const()[name = tensor("value_25_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_11_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145069696)))]; tensor var_2633_cast_fp16 = add(x = q_67_cast_fp16, y = encoder_layers_11_self_attn_pos_bias_u_to_fp16)[name = tensor("op_2633_cast_fp16")]; tensor encoder_layers_11_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145070784)))]; tensor var_2635_cast_fp16 = add(x = q_67_cast_fp16, y = encoder_layers_11_self_attn_pos_bias_v_to_fp16)[name = tensor("op_2635_cast_fp16")]; tensor q_with_bias_v_23_perm_0 = const()[name = tensor("q_with_bias_v_23_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_293_transpose_x_0 = const()[name = tensor("x_293_transpose_x_0"), val = tensor(false)]; tensor x_293_transpose_y_0 = const()[name = tensor("x_293_transpose_y_0"), val = tensor(false)]; tensor var_2637_to_fp16 = const()[name = tensor("op_2637_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145071872)))]; tensor q_with_bias_v_23_cast_fp16 = transpose(perm = q_with_bias_v_23_perm_0, x = var_2635_cast_fp16)[name = tensor("transpose_138")]; tensor x_293_cast_fp16 = matmul(transpose_x = x_293_transpose_x_0, transpose_y = x_293_transpose_y_0, x = q_with_bias_v_23_cast_fp16, y = var_2637_to_fp16)[name = tensor("x_293_cast_fp16")]; tensor x_295_pad_0 = const()[name = tensor("x_295_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_295_mode_0 = const()[name = tensor("x_295_mode_0"), val = tensor("constant")]; tensor const_166_to_fp16 = const()[name = tensor("const_166_to_fp16"), val = tensor(0x0p+0)]; tensor x_295_cast_fp16 = pad(constant_val = const_166_to_fp16, mode = x_295_mode_0, pad = x_295_pad_0, x = x_293_cast_fp16)[name = tensor("x_295_cast_fp16")]; tensor var_2645 = const()[name = tensor("op_2645"), val = tensor([1, 8, -1, 3])]; tensor x_297_cast_fp16 = reshape(shape = var_2645, x = x_295_cast_fp16)[name = tensor("x_297_cast_fp16")]; tensor var_2649_begin_0 = const()[name = tensor("op_2649_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_2649_end_0 = const()[name = tensor("op_2649_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_2649_end_mask_0 = const()[name = tensor("op_2649_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_2649_cast_fp16 = slice_by_index(begin = var_2649_begin_0, end = var_2649_end_0, end_mask = var_2649_end_mask_0, x = x_297_cast_fp16)[name = tensor("op_2649_cast_fp16")]; tensor var_2650 = const()[name = tensor("op_2650"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_45_cast_fp16 = reshape(shape = var_2650, x = var_2649_cast_fp16)[name = tensor("matrix_bd_45_cast_fp16")]; tensor matrix_ac_23_transpose_x_0 = const()[name = tensor("matrix_ac_23_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_23_transpose_y_0 = const()[name = tensor("matrix_ac_23_transpose_y_0"), val = tensor(false)]; tensor transpose_73_perm_0 = const()[name = tensor("transpose_73_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_74_perm_0 = const()[name = tensor("transpose_74_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_74 = transpose(perm = transpose_74_perm_0, x = k_45_cast_fp16)[name = tensor("transpose_136")]; tensor transpose_73 = transpose(perm = transpose_73_perm_0, x = var_2633_cast_fp16)[name = tensor("transpose_137")]; tensor matrix_ac_23_cast_fp16 = matmul(transpose_x = matrix_ac_23_transpose_x_0, transpose_y = matrix_ac_23_transpose_y_0, x = transpose_73, y = transpose_74)[name = tensor("matrix_ac_23_cast_fp16")]; tensor matrix_bd_47_begin_0 = const()[name = tensor("matrix_bd_47_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_47_end_0 = const()[name = tensor("matrix_bd_47_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_47_end_mask_0 = const()[name = tensor("matrix_bd_47_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_47_cast_fp16 = slice_by_index(begin = matrix_bd_47_begin_0, end = matrix_bd_47_end_0, end_mask = matrix_bd_47_end_mask_0, x = matrix_bd_45_cast_fp16)[name = tensor("matrix_bd_47_cast_fp16")]; tensor var_2659_cast_fp16 = add(x = matrix_ac_23_cast_fp16, y = matrix_bd_47_cast_fp16)[name = tensor("op_2659_cast_fp16")]; tensor _inversed_scores_45_y_0_to_fp16 = const()[name = tensor("_inversed_scores_45_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_45_cast_fp16 = mul(x = var_2659_cast_fp16, y = _inversed_scores_45_y_0_to_fp16)[name = tensor("_inversed_scores_45_cast_fp16")]; tensor scores_47_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_45_cast_fp16, cond = mask_3)[name = tensor("scores_47_cast_fp16")]; tensor var_2665_cast_fp16 = softmax(axis = var_62, x = scores_47_cast_fp16)[name = tensor("op_2665_cast_fp16")]; tensor input_613_cast_fp16 = select(a = var_40_to_fp16, b = var_2665_cast_fp16, cond = mask_3)[name = tensor("input_613_cast_fp16")]; tensor x_299_transpose_x_0 = const()[name = tensor("x_299_transpose_x_0"), val = tensor(false)]; tensor x_299_transpose_y_0 = const()[name = tensor("x_299_transpose_y_0"), val = tensor(false)]; tensor value_25_cast_fp16 = transpose(perm = value_25_perm_0, x = v_23_cast_fp16)[name = tensor("transpose_139")]; tensor x_299_cast_fp16 = matmul(transpose_x = x_299_transpose_x_0, transpose_y = x_299_transpose_y_0, x = input_613_cast_fp16, y = value_25_cast_fp16)[name = tensor("x_299_cast_fp16")]; tensor var_2669_perm_0 = const()[name = tensor("op_2669_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2670 = const()[name = tensor("op_2670"), val = tensor([1, -1, 512])]; tensor var_2669_cast_fp16 = transpose(perm = var_2669_perm_0, x = x_299_cast_fp16)[name = tensor("transpose_135")]; tensor input_615_cast_fp16 = reshape(shape = var_2670, x = var_2669_cast_fp16)[name = tensor("input_615_cast_fp16")]; tensor encoder_layers_11_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_11_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145220416)))]; tensor linear_106_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_11_self_attn_linear_out_weight_to_fp16, x = input_615_cast_fp16)[name = tensor("linear_106_cast_fp16")]; tensor input_619_cast_fp16 = add(x = input_609_cast_fp16, y = linear_106_cast_fp16)[name = tensor("input_619_cast_fp16")]; tensor x_303_axes_0 = const()[name = tensor("x_303_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_11_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145744768)))]; tensor encoder_layers_11_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_11_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145745856)))]; tensor x_303_cast_fp16 = layer_norm(axes = x_303_axes_0, beta = encoder_layers_11_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_11_norm_conv_weight_to_fp16, x = input_619_cast_fp16)[name = tensor("x_303_cast_fp16")]; tensor input_621_perm_0 = const()[name = tensor("input_621_perm_0"), val = tensor([0, 2, 1])]; tensor input_623_pad_type_0 = const()[name = tensor("input_623_pad_type_0"), val = tensor("valid")]; tensor input_623_strides_0 = const()[name = tensor("input_623_strides_0"), val = tensor([1])]; tensor input_623_pad_0 = const()[name = tensor("input_623_pad_0"), val = tensor([0, 0])]; tensor input_623_dilations_0 = const()[name = tensor("input_623_dilations_0"), val = tensor([1])]; tensor input_623_groups_0 = const()[name = tensor("input_623_groups_0"), val = tensor(1)]; tensor encoder_layers_11_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_11_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145746944)))]; tensor input_621_cast_fp16 = transpose(perm = input_621_perm_0, x = x_303_cast_fp16)[name = tensor("transpose_134")]; tensor input_623_cast_fp16 = conv(dilations = input_623_dilations_0, groups = input_623_groups_0, pad = input_623_pad_0, pad_type = input_623_pad_type_0, strides = input_623_strides_0, weight = encoder_layers_11_conv_pointwise_conv1_weight_to_fp16, x = input_621_cast_fp16)[name = tensor("input_623_cast_fp16")]; tensor x_305_split_num_splits_0 = const()[name = tensor("x_305_split_num_splits_0"), val = tensor(2)]; tensor x_305_split_axis_0 = const()[name = tensor("x_305_split_axis_0"), val = tensor(1)]; tensor x_305_split_cast_fp16_0, tensor x_305_split_cast_fp16_1 = split(axis = x_305_split_axis_0, num_splits = x_305_split_num_splits_0, x = input_623_cast_fp16)[name = tensor("x_305_split_cast_fp16")]; tensor x_305_split_1_sigmoid_cast_fp16 = sigmoid(x = x_305_split_cast_fp16_1)[name = tensor("x_305_split_1_sigmoid_cast_fp16")]; tensor x_305_cast_fp16 = mul(x = x_305_split_cast_fp16_0, y = x_305_split_1_sigmoid_cast_fp16)[name = tensor("x_305_cast_fp16")]; tensor input_625_cast_fp16 = select(a = var_40_to_fp16, b = x_305_cast_fp16, cond = var_418)[name = tensor("input_625_cast_fp16")]; tensor new_x_47_interleave_0 = const()[name = tensor("new_x_47_interleave_0"), val = tensor(false)]; tensor new_x_47_cast_fp16 = concat(axis = var_62, interleave = new_x_47_interleave_0, values = (cache_47_cast_fp16, input_625_cast_fp16))[name = tensor("new_x_47_cast_fp16")]; tensor next_cache_23_begin_0 = const()[name = tensor("next_cache_23_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_23_end_0 = const()[name = tensor("next_cache_23_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_23_end_mask_0 = const()[name = tensor("next_cache_23_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_23_cast_fp16 = slice_by_index(begin = next_cache_23_begin_0, end = next_cache_23_end_0, end_mask = next_cache_23_end_mask_0, x = new_x_47_cast_fp16)[name = tensor("next_cache_23_cast_fp16")]; tensor var_2711_begin_0 = const()[name = tensor("op_2711_begin_0"), val = tensor([0, 0, 1])]; tensor var_2711_end_0 = const()[name = tensor("op_2711_end_0"), val = tensor([1, 512, 9])]; tensor var_2711_end_mask_0 = const()[name = tensor("op_2711_end_mask_0"), val = tensor([true, true, true])]; tensor var_2711_cast_fp16 = slice_by_index(begin = var_2711_begin_0, end = var_2711_end_0, end_mask = var_2711_end_mask_0, x = next_cache_23_cast_fp16)[name = tensor("op_2711_cast_fp16")]; tensor x_307_pad_type_0 = const()[name = tensor("x_307_pad_type_0"), val = tensor("valid")]; tensor x_307_groups_0 = const()[name = tensor("x_307_groups_0"), val = tensor(512)]; tensor x_307_strides_0 = const()[name = tensor("x_307_strides_0"), val = tensor([1])]; tensor x_307_pad_0 = const()[name = tensor("x_307_pad_0"), val = tensor([0, 0])]; tensor x_307_dilations_0 = const()[name = tensor("x_307_dilations_0"), val = tensor([1])]; tensor encoder_layers_11_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_11_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146795584)))]; tensor x_307_cast_fp16 = conv(dilations = x_307_dilations_0, groups = x_307_groups_0, pad = x_307_pad_0, pad_type = x_307_pad_type_0, strides = x_307_strides_0, weight = encoder_layers_11_conv_depthwise_conv_weight_to_fp16, x = new_x_47_cast_fp16)[name = tensor("x_307_cast_fp16")]; tensor input_627_perm_0 = const()[name = tensor("input_627_perm_0"), val = tensor([0, 2, 1])]; tensor x_309_axes_0 = const()[name = tensor("x_309_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_11_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146804864)))]; tensor encoder_layers_11_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_11_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146805952)))]; tensor input_627_cast_fp16 = transpose(perm = input_627_perm_0, x = x_307_cast_fp16)[name = tensor("transpose_133")]; tensor x_309_cast_fp16 = layer_norm(axes = x_309_axes_0, beta = encoder_layers_11_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_11_conv_batch_norm_weight_to_fp16, x = input_627_cast_fp16)[name = tensor("x_309_cast_fp16")]; tensor input_629_perm_0 = const()[name = tensor("input_629_perm_0"), val = tensor([0, 2, 1])]; tensor input_629_cast_fp16 = transpose(perm = input_629_perm_0, x = x_309_cast_fp16)[name = tensor("transpose_132")]; tensor input_631_cast_fp16 = silu(x = input_629_cast_fp16)[name = tensor("input_631_cast_fp16")]; tensor x_311_pad_type_0 = const()[name = tensor("x_311_pad_type_0"), val = tensor("valid")]; tensor x_311_strides_0 = const()[name = tensor("x_311_strides_0"), val = tensor([1])]; tensor x_311_pad_0 = const()[name = tensor("x_311_pad_0"), val = tensor([0, 0])]; tensor x_311_dilations_0 = const()[name = tensor("x_311_dilations_0"), val = tensor([1])]; tensor x_311_groups_0 = const()[name = tensor("x_311_groups_0"), val = tensor(1)]; tensor encoder_layers_11_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_11_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146807040)))]; tensor x_311_cast_fp16 = conv(dilations = x_311_dilations_0, groups = x_311_groups_0, pad = x_311_pad_0, pad_type = x_311_pad_type_0, strides = x_311_strides_0, weight = encoder_layers_11_conv_pointwise_conv2_weight_to_fp16, x = input_631_cast_fp16)[name = tensor("x_311_cast_fp16")]; tensor input_633_perm_0 = const()[name = tensor("input_633_perm_0"), val = tensor([0, 2, 1])]; tensor input_633_cast_fp16 = transpose(perm = input_633_perm_0, x = x_311_cast_fp16)[name = tensor("transpose_131")]; tensor input_635_cast_fp16 = add(x = input_619_cast_fp16, y = input_633_cast_fp16)[name = tensor("input_635_cast_fp16")]; tensor input_637_axes_0 = const()[name = tensor("input_637_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_11_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(147331392)))]; tensor encoder_layers_11_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_11_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(147332480)))]; tensor input_637_cast_fp16 = layer_norm(axes = input_637_axes_0, beta = encoder_layers_11_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_11_norm_feed_forward2_weight_to_fp16, x = input_635_cast_fp16)[name = tensor("input_637_cast_fp16")]; tensor encoder_layers_11_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_11_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(147333568)))]; tensor linear_107_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_11_feed_forward2_linear1_weight_to_fp16, x = input_637_cast_fp16)[name = tensor("linear_107_cast_fp16")]; tensor input_641_cast_fp16 = silu(x = linear_107_cast_fp16)[name = tensor("input_641_cast_fp16")]; tensor encoder_layers_11_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_11_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(149430784)))]; tensor linear_108_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_11_feed_forward2_linear2_weight_to_fp16, x = input_641_cast_fp16)[name = tensor("linear_108_cast_fp16")]; tensor var_2752_to_fp16 = const()[name = tensor("op_2752_to_fp16"), val = tensor(0x1p-1)]; tensor var_2753_cast_fp16 = mul(x = linear_108_cast_fp16, y = var_2752_to_fp16)[name = tensor("op_2753_cast_fp16")]; tensor input_647_cast_fp16 = add(x = input_635_cast_fp16, y = var_2753_cast_fp16)[name = tensor("input_647_cast_fp16")]; tensor input_649_axes_0 = const()[name = tensor("input_649_axes_0"), val = tensor([-1])]; tensor encoder_layers_11_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_11_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151528000)))]; tensor encoder_layers_11_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_11_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151529088)))]; tensor input_649_cast_fp16 = layer_norm(axes = input_649_axes_0, beta = encoder_layers_11_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_11_norm_out_weight_to_fp16, x = input_647_cast_fp16)[name = tensor("input_649_cast_fp16")]; tensor cache_49_begin_0 = const()[name = tensor("cache_49_begin_0"), val = tensor([12, 0, 0, 0])]; tensor cache_49_end_0 = const()[name = tensor("cache_49_end_0"), val = tensor([13, 1, 70, 512])]; tensor cache_49_end_mask_0 = const()[name = tensor("cache_49_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_49_squeeze_mask_0 = const()[name = tensor("cache_49_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_49_cast_fp16 = slice_by_index(begin = cache_49_begin_0, end = cache_49_end_0, end_mask = cache_49_end_mask_0, squeeze_mask = cache_49_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_49_cast_fp16")]; tensor cache_51_begin_0 = const()[name = tensor("cache_51_begin_0"), val = tensor([12, 0, 0, 0])]; tensor cache_51_end_0 = const()[name = tensor("cache_51_end_0"), val = tensor([13, 1, 512, 8])]; tensor cache_51_end_mask_0 = const()[name = tensor("cache_51_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_51_squeeze_mask_0 = const()[name = tensor("cache_51_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_51_cast_fp16 = slice_by_index(begin = cache_51_begin_0, end = cache_51_end_0, end_mask = cache_51_end_mask_0, squeeze_mask = cache_51_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_51_cast_fp16")]; tensor input_651_axes_0 = const()[name = tensor("input_651_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_12_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151530176)))]; tensor encoder_layers_12_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_12_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151531264)))]; tensor input_651_cast_fp16 = layer_norm(axes = input_651_axes_0, beta = encoder_layers_12_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_12_norm_feed_forward1_weight_to_fp16, x = input_649_cast_fp16)[name = tensor("input_651_cast_fp16")]; tensor encoder_layers_12_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_12_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151532352)))]; tensor linear_109_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_12_feed_forward1_linear1_weight_to_fp16, x = input_651_cast_fp16)[name = tensor("linear_109_cast_fp16")]; tensor input_655_cast_fp16 = silu(x = linear_109_cast_fp16)[name = tensor("input_655_cast_fp16")]; tensor encoder_layers_12_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_12_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(153629568)))]; tensor linear_110_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_12_feed_forward1_linear2_weight_to_fp16, x = input_655_cast_fp16)[name = tensor("linear_110_cast_fp16")]; tensor var_2787_to_fp16 = const()[name = tensor("op_2787_to_fp16"), val = tensor(0x1p-1)]; tensor var_2788_cast_fp16 = mul(x = linear_110_cast_fp16, y = var_2787_to_fp16)[name = tensor("op_2788_cast_fp16")]; tensor input_661_cast_fp16 = add(x = input_649_cast_fp16, y = var_2788_cast_fp16)[name = tensor("input_661_cast_fp16")]; tensor key_25_axes_0 = const()[name = tensor("key_25_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_12_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(155726784)))]; tensor encoder_layers_12_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_12_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(155727872)))]; tensor key_25_cast_fp16 = layer_norm(axes = key_25_axes_0, beta = encoder_layers_12_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_12_norm_self_att_weight_to_fp16, x = input_661_cast_fp16)[name = tensor("key_25_cast_fp16")]; tensor input_663_interleave_0 = const()[name = tensor("input_663_interleave_0"), val = tensor(false)]; tensor input_663_cast_fp16 = concat(axis = var_64, interleave = input_663_interleave_0, values = (cache_49_cast_fp16, key_25_cast_fp16))[name = tensor("input_663_cast_fp16")]; tensor var_2810_begin_0 = const()[name = tensor("op_2810_begin_0"), val = tensor([0, 1, 0])]; tensor var_2810_end_0 = const()[name = tensor("op_2810_end_0"), val = tensor([1, 70, 512])]; tensor var_2810_end_mask_0 = const()[name = tensor("op_2810_end_mask_0"), val = tensor([true, true, true])]; tensor var_2810_cast_fp16 = slice_by_index(begin = var_2810_begin_0, end = var_2810_end_0, end_mask = var_2810_end_mask_0, x = cache_49_cast_fp16)[name = tensor("op_2810_cast_fp16")]; tensor var_2813_begin_0 = const()[name = tensor("op_2813_begin_0"), val = tensor([0, 0, 0])]; tensor var_2813_end_0 = const()[name = tensor("op_2813_end_0"), val = tensor([1, 1, 512])]; tensor var_2813_end_mask_0 = const()[name = tensor("op_2813_end_mask_0"), val = tensor([true, false, true])]; tensor var_2813_cast_fp16 = slice_by_index(begin = var_2813_begin_0, end = var_2813_end_0, end_mask = var_2813_end_mask_0, x = key_25_cast_fp16)[name = tensor("op_2813_cast_fp16")]; tensor var_2816_interleave_0 = const()[name = tensor("op_2816_interleave_0"), val = tensor(false)]; tensor var_2816_cast_fp16 = concat(axis = var_64, interleave = var_2816_interleave_0, values = (var_2810_cast_fp16, var_2813_cast_fp16))[name = tensor("op_2816_cast_fp16")]; tensor encoder_layers_12_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(155728960)))]; tensor linear_111_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_12_self_attn_linear_q_weight_to_fp16, x = key_25_cast_fp16)[name = tensor("linear_111_cast_fp16")]; tensor var_2820 = const()[name = tensor("op_2820"), val = tensor([1, -1, 8, 64])]; tensor q_73_cast_fp16 = reshape(shape = var_2820, x = linear_111_cast_fp16)[name = tensor("q_73_cast_fp16")]; tensor encoder_layers_12_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(156253312)))]; tensor linear_112_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_12_self_attn_linear_k_weight_to_fp16, x = input_663_cast_fp16)[name = tensor("linear_112_cast_fp16")]; tensor var_2824 = const()[name = tensor("op_2824"), val = tensor([1, -1, 8, 64])]; tensor k_49_cast_fp16 = reshape(shape = var_2824, x = linear_112_cast_fp16)[name = tensor("k_49_cast_fp16")]; tensor encoder_layers_12_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(156777664)))]; tensor linear_113_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_12_self_attn_linear_v_weight_to_fp16, x = input_663_cast_fp16)[name = tensor("linear_113_cast_fp16")]; tensor var_2828 = const()[name = tensor("op_2828"), val = tensor([1, -1, 8, 64])]; tensor v_25_cast_fp16 = reshape(shape = var_2828, x = linear_113_cast_fp16)[name = tensor("v_25_cast_fp16")]; tensor value_27_perm_0 = const()[name = tensor("value_27_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_12_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157302016)))]; tensor var_2840_cast_fp16 = add(x = q_73_cast_fp16, y = encoder_layers_12_self_attn_pos_bias_u_to_fp16)[name = tensor("op_2840_cast_fp16")]; tensor encoder_layers_12_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157303104)))]; tensor var_2842_cast_fp16 = add(x = q_73_cast_fp16, y = encoder_layers_12_self_attn_pos_bias_v_to_fp16)[name = tensor("op_2842_cast_fp16")]; tensor q_with_bias_v_25_perm_0 = const()[name = tensor("q_with_bias_v_25_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_319_transpose_x_0 = const()[name = tensor("x_319_transpose_x_0"), val = tensor(false)]; tensor x_319_transpose_y_0 = const()[name = tensor("x_319_transpose_y_0"), val = tensor(false)]; tensor var_2844_to_fp16 = const()[name = tensor("op_2844_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157304192)))]; tensor q_with_bias_v_25_cast_fp16 = transpose(perm = q_with_bias_v_25_perm_0, x = var_2842_cast_fp16)[name = tensor("transpose_129")]; tensor x_319_cast_fp16 = matmul(transpose_x = x_319_transpose_x_0, transpose_y = x_319_transpose_y_0, x = q_with_bias_v_25_cast_fp16, y = var_2844_to_fp16)[name = tensor("x_319_cast_fp16")]; tensor x_321_pad_0 = const()[name = tensor("x_321_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_321_mode_0 = const()[name = tensor("x_321_mode_0"), val = tensor("constant")]; tensor const_179_to_fp16 = const()[name = tensor("const_179_to_fp16"), val = tensor(0x0p+0)]; tensor x_321_cast_fp16 = pad(constant_val = const_179_to_fp16, mode = x_321_mode_0, pad = x_321_pad_0, x = x_319_cast_fp16)[name = tensor("x_321_cast_fp16")]; tensor var_2852 = const()[name = tensor("op_2852"), val = tensor([1, 8, -1, 3])]; tensor x_323_cast_fp16 = reshape(shape = var_2852, x = x_321_cast_fp16)[name = tensor("x_323_cast_fp16")]; tensor var_2856_begin_0 = const()[name = tensor("op_2856_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_2856_end_0 = const()[name = tensor("op_2856_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_2856_end_mask_0 = const()[name = tensor("op_2856_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_2856_cast_fp16 = slice_by_index(begin = var_2856_begin_0, end = var_2856_end_0, end_mask = var_2856_end_mask_0, x = x_323_cast_fp16)[name = tensor("op_2856_cast_fp16")]; tensor var_2857 = const()[name = tensor("op_2857"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_49_cast_fp16 = reshape(shape = var_2857, x = var_2856_cast_fp16)[name = tensor("matrix_bd_49_cast_fp16")]; tensor matrix_ac_25_transpose_x_0 = const()[name = tensor("matrix_ac_25_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_25_transpose_y_0 = const()[name = tensor("matrix_ac_25_transpose_y_0"), val = tensor(false)]; tensor transpose_75_perm_0 = const()[name = tensor("transpose_75_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_76_perm_0 = const()[name = tensor("transpose_76_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_76 = transpose(perm = transpose_76_perm_0, x = k_49_cast_fp16)[name = tensor("transpose_127")]; tensor transpose_75 = transpose(perm = transpose_75_perm_0, x = var_2840_cast_fp16)[name = tensor("transpose_128")]; tensor matrix_ac_25_cast_fp16 = matmul(transpose_x = matrix_ac_25_transpose_x_0, transpose_y = matrix_ac_25_transpose_y_0, x = transpose_75, y = transpose_76)[name = tensor("matrix_ac_25_cast_fp16")]; tensor matrix_bd_51_begin_0 = const()[name = tensor("matrix_bd_51_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_51_end_0 = const()[name = tensor("matrix_bd_51_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_51_end_mask_0 = const()[name = tensor("matrix_bd_51_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_51_cast_fp16 = slice_by_index(begin = matrix_bd_51_begin_0, end = matrix_bd_51_end_0, end_mask = matrix_bd_51_end_mask_0, x = matrix_bd_49_cast_fp16)[name = tensor("matrix_bd_51_cast_fp16")]; tensor var_2866_cast_fp16 = add(x = matrix_ac_25_cast_fp16, y = matrix_bd_51_cast_fp16)[name = tensor("op_2866_cast_fp16")]; tensor _inversed_scores_49_y_0_to_fp16 = const()[name = tensor("_inversed_scores_49_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_49_cast_fp16 = mul(x = var_2866_cast_fp16, y = _inversed_scores_49_y_0_to_fp16)[name = tensor("_inversed_scores_49_cast_fp16")]; tensor scores_51_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_49_cast_fp16, cond = mask_3)[name = tensor("scores_51_cast_fp16")]; tensor var_2872_cast_fp16 = softmax(axis = var_62, x = scores_51_cast_fp16)[name = tensor("op_2872_cast_fp16")]; tensor input_665_cast_fp16 = select(a = var_40_to_fp16, b = var_2872_cast_fp16, cond = mask_3)[name = tensor("input_665_cast_fp16")]; tensor x_325_transpose_x_0 = const()[name = tensor("x_325_transpose_x_0"), val = tensor(false)]; tensor x_325_transpose_y_0 = const()[name = tensor("x_325_transpose_y_0"), val = tensor(false)]; tensor value_27_cast_fp16 = transpose(perm = value_27_perm_0, x = v_25_cast_fp16)[name = tensor("transpose_130")]; tensor x_325_cast_fp16 = matmul(transpose_x = x_325_transpose_x_0, transpose_y = x_325_transpose_y_0, x = input_665_cast_fp16, y = value_27_cast_fp16)[name = tensor("x_325_cast_fp16")]; tensor var_2876_perm_0 = const()[name = tensor("op_2876_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_2877 = const()[name = tensor("op_2877"), val = tensor([1, -1, 512])]; tensor var_2876_cast_fp16 = transpose(perm = var_2876_perm_0, x = x_325_cast_fp16)[name = tensor("transpose_126")]; tensor input_667_cast_fp16 = reshape(shape = var_2877, x = var_2876_cast_fp16)[name = tensor("input_667_cast_fp16")]; tensor encoder_layers_12_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_12_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157452736)))]; tensor linear_115_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_12_self_attn_linear_out_weight_to_fp16, x = input_667_cast_fp16)[name = tensor("linear_115_cast_fp16")]; tensor input_671_cast_fp16 = add(x = input_661_cast_fp16, y = linear_115_cast_fp16)[name = tensor("input_671_cast_fp16")]; tensor x_329_axes_0 = const()[name = tensor("x_329_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_12_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157977088)))]; tensor encoder_layers_12_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_12_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157978176)))]; tensor x_329_cast_fp16 = layer_norm(axes = x_329_axes_0, beta = encoder_layers_12_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_12_norm_conv_weight_to_fp16, x = input_671_cast_fp16)[name = tensor("x_329_cast_fp16")]; tensor input_673_perm_0 = const()[name = tensor("input_673_perm_0"), val = tensor([0, 2, 1])]; tensor input_675_pad_type_0 = const()[name = tensor("input_675_pad_type_0"), val = tensor("valid")]; tensor input_675_strides_0 = const()[name = tensor("input_675_strides_0"), val = tensor([1])]; tensor input_675_pad_0 = const()[name = tensor("input_675_pad_0"), val = tensor([0, 0])]; tensor input_675_dilations_0 = const()[name = tensor("input_675_dilations_0"), val = tensor([1])]; tensor input_675_groups_0 = const()[name = tensor("input_675_groups_0"), val = tensor(1)]; tensor encoder_layers_12_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_12_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157979264)))]; tensor input_673_cast_fp16 = transpose(perm = input_673_perm_0, x = x_329_cast_fp16)[name = tensor("transpose_125")]; tensor input_675_cast_fp16 = conv(dilations = input_675_dilations_0, groups = input_675_groups_0, pad = input_675_pad_0, pad_type = input_675_pad_type_0, strides = input_675_strides_0, weight = encoder_layers_12_conv_pointwise_conv1_weight_to_fp16, x = input_673_cast_fp16)[name = tensor("input_675_cast_fp16")]; tensor x_331_split_num_splits_0 = const()[name = tensor("x_331_split_num_splits_0"), val = tensor(2)]; tensor x_331_split_axis_0 = const()[name = tensor("x_331_split_axis_0"), val = tensor(1)]; tensor x_331_split_cast_fp16_0, tensor x_331_split_cast_fp16_1 = split(axis = x_331_split_axis_0, num_splits = x_331_split_num_splits_0, x = input_675_cast_fp16)[name = tensor("x_331_split_cast_fp16")]; tensor x_331_split_1_sigmoid_cast_fp16 = sigmoid(x = x_331_split_cast_fp16_1)[name = tensor("x_331_split_1_sigmoid_cast_fp16")]; tensor x_331_cast_fp16 = mul(x = x_331_split_cast_fp16_0, y = x_331_split_1_sigmoid_cast_fp16)[name = tensor("x_331_cast_fp16")]; tensor input_677_cast_fp16 = select(a = var_40_to_fp16, b = x_331_cast_fp16, cond = var_418)[name = tensor("input_677_cast_fp16")]; tensor new_x_51_interleave_0 = const()[name = tensor("new_x_51_interleave_0"), val = tensor(false)]; tensor new_x_51_cast_fp16 = concat(axis = var_62, interleave = new_x_51_interleave_0, values = (cache_51_cast_fp16, input_677_cast_fp16))[name = tensor("new_x_51_cast_fp16")]; tensor next_cache_25_begin_0 = const()[name = tensor("next_cache_25_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_25_end_0 = const()[name = tensor("next_cache_25_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_25_end_mask_0 = const()[name = tensor("next_cache_25_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_25_cast_fp16 = slice_by_index(begin = next_cache_25_begin_0, end = next_cache_25_end_0, end_mask = next_cache_25_end_mask_0, x = new_x_51_cast_fp16)[name = tensor("next_cache_25_cast_fp16")]; tensor var_2918_begin_0 = const()[name = tensor("op_2918_begin_0"), val = tensor([0, 0, 1])]; tensor var_2918_end_0 = const()[name = tensor("op_2918_end_0"), val = tensor([1, 512, 9])]; tensor var_2918_end_mask_0 = const()[name = tensor("op_2918_end_mask_0"), val = tensor([true, true, true])]; tensor var_2918_cast_fp16 = slice_by_index(begin = var_2918_begin_0, end = var_2918_end_0, end_mask = var_2918_end_mask_0, x = next_cache_25_cast_fp16)[name = tensor("op_2918_cast_fp16")]; tensor x_333_pad_type_0 = const()[name = tensor("x_333_pad_type_0"), val = tensor("valid")]; tensor x_333_groups_0 = const()[name = tensor("x_333_groups_0"), val = tensor(512)]; tensor x_333_strides_0 = const()[name = tensor("x_333_strides_0"), val = tensor([1])]; tensor x_333_pad_0 = const()[name = tensor("x_333_pad_0"), val = tensor([0, 0])]; tensor x_333_dilations_0 = const()[name = tensor("x_333_dilations_0"), val = tensor([1])]; tensor encoder_layers_12_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_12_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159027904)))]; tensor x_333_cast_fp16 = conv(dilations = x_333_dilations_0, groups = x_333_groups_0, pad = x_333_pad_0, pad_type = x_333_pad_type_0, strides = x_333_strides_0, weight = encoder_layers_12_conv_depthwise_conv_weight_to_fp16, x = new_x_51_cast_fp16)[name = tensor("x_333_cast_fp16")]; tensor input_679_perm_0 = const()[name = tensor("input_679_perm_0"), val = tensor([0, 2, 1])]; tensor x_335_axes_0 = const()[name = tensor("x_335_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_12_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159037184)))]; tensor encoder_layers_12_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_12_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159038272)))]; tensor input_679_cast_fp16 = transpose(perm = input_679_perm_0, x = x_333_cast_fp16)[name = tensor("transpose_124")]; tensor x_335_cast_fp16 = layer_norm(axes = x_335_axes_0, beta = encoder_layers_12_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_12_conv_batch_norm_weight_to_fp16, x = input_679_cast_fp16)[name = tensor("x_335_cast_fp16")]; tensor input_681_perm_0 = const()[name = tensor("input_681_perm_0"), val = tensor([0, 2, 1])]; tensor input_681_cast_fp16 = transpose(perm = input_681_perm_0, x = x_335_cast_fp16)[name = tensor("transpose_123")]; tensor input_683_cast_fp16 = silu(x = input_681_cast_fp16)[name = tensor("input_683_cast_fp16")]; tensor x_337_pad_type_0 = const()[name = tensor("x_337_pad_type_0"), val = tensor("valid")]; tensor x_337_strides_0 = const()[name = tensor("x_337_strides_0"), val = tensor([1])]; tensor x_337_pad_0 = const()[name = tensor("x_337_pad_0"), val = tensor([0, 0])]; tensor x_337_dilations_0 = const()[name = tensor("x_337_dilations_0"), val = tensor([1])]; tensor x_337_groups_0 = const()[name = tensor("x_337_groups_0"), val = tensor(1)]; tensor encoder_layers_12_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_12_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159039360)))]; tensor x_337_cast_fp16 = conv(dilations = x_337_dilations_0, groups = x_337_groups_0, pad = x_337_pad_0, pad_type = x_337_pad_type_0, strides = x_337_strides_0, weight = encoder_layers_12_conv_pointwise_conv2_weight_to_fp16, x = input_683_cast_fp16)[name = tensor("x_337_cast_fp16")]; tensor input_685_perm_0 = const()[name = tensor("input_685_perm_0"), val = tensor([0, 2, 1])]; tensor input_685_cast_fp16 = transpose(perm = input_685_perm_0, x = x_337_cast_fp16)[name = tensor("transpose_122")]; tensor input_687_cast_fp16 = add(x = input_671_cast_fp16, y = input_685_cast_fp16)[name = tensor("input_687_cast_fp16")]; tensor input_689_axes_0 = const()[name = tensor("input_689_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_12_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159563712)))]; tensor encoder_layers_12_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_12_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159564800)))]; tensor input_689_cast_fp16 = layer_norm(axes = input_689_axes_0, beta = encoder_layers_12_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_12_norm_feed_forward2_weight_to_fp16, x = input_687_cast_fp16)[name = tensor("input_689_cast_fp16")]; tensor encoder_layers_12_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_12_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159565888)))]; tensor linear_116_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_12_feed_forward2_linear1_weight_to_fp16, x = input_689_cast_fp16)[name = tensor("linear_116_cast_fp16")]; tensor input_693_cast_fp16 = silu(x = linear_116_cast_fp16)[name = tensor("input_693_cast_fp16")]; tensor encoder_layers_12_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_12_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(161663104)))]; tensor linear_117_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_12_feed_forward2_linear2_weight_to_fp16, x = input_693_cast_fp16)[name = tensor("linear_117_cast_fp16")]; tensor var_2959_to_fp16 = const()[name = tensor("op_2959_to_fp16"), val = tensor(0x1p-1)]; tensor var_2960_cast_fp16 = mul(x = linear_117_cast_fp16, y = var_2959_to_fp16)[name = tensor("op_2960_cast_fp16")]; tensor input_699_cast_fp16 = add(x = input_687_cast_fp16, y = var_2960_cast_fp16)[name = tensor("input_699_cast_fp16")]; tensor input_701_axes_0 = const()[name = tensor("input_701_axes_0"), val = tensor([-1])]; tensor encoder_layers_12_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_12_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163760320)))]; tensor encoder_layers_12_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_12_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163761408)))]; tensor input_701_cast_fp16 = layer_norm(axes = input_701_axes_0, beta = encoder_layers_12_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_12_norm_out_weight_to_fp16, x = input_699_cast_fp16)[name = tensor("input_701_cast_fp16")]; tensor cache_53_begin_0 = const()[name = tensor("cache_53_begin_0"), val = tensor([13, 0, 0, 0])]; tensor cache_53_end_0 = const()[name = tensor("cache_53_end_0"), val = tensor([14, 1, 70, 512])]; tensor cache_53_end_mask_0 = const()[name = tensor("cache_53_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_53_squeeze_mask_0 = const()[name = tensor("cache_53_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_53_cast_fp16 = slice_by_index(begin = cache_53_begin_0, end = cache_53_end_0, end_mask = cache_53_end_mask_0, squeeze_mask = cache_53_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_53_cast_fp16")]; tensor cache_55_begin_0 = const()[name = tensor("cache_55_begin_0"), val = tensor([13, 0, 0, 0])]; tensor cache_55_end_0 = const()[name = tensor("cache_55_end_0"), val = tensor([14, 1, 512, 8])]; tensor cache_55_end_mask_0 = const()[name = tensor("cache_55_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_55_squeeze_mask_0 = const()[name = tensor("cache_55_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_55_cast_fp16 = slice_by_index(begin = cache_55_begin_0, end = cache_55_end_0, end_mask = cache_55_end_mask_0, squeeze_mask = cache_55_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_55_cast_fp16")]; tensor input_703_axes_0 = const()[name = tensor("input_703_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_13_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163762496)))]; tensor encoder_layers_13_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_13_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163763584)))]; tensor input_703_cast_fp16 = layer_norm(axes = input_703_axes_0, beta = encoder_layers_13_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_13_norm_feed_forward1_weight_to_fp16, x = input_701_cast_fp16)[name = tensor("input_703_cast_fp16")]; tensor encoder_layers_13_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_13_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163764672)))]; tensor linear_118_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_13_feed_forward1_linear1_weight_to_fp16, x = input_703_cast_fp16)[name = tensor("linear_118_cast_fp16")]; tensor input_707_cast_fp16 = silu(x = linear_118_cast_fp16)[name = tensor("input_707_cast_fp16")]; tensor encoder_layers_13_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_13_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165861888)))]; tensor linear_119_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_13_feed_forward1_linear2_weight_to_fp16, x = input_707_cast_fp16)[name = tensor("linear_119_cast_fp16")]; tensor var_2994_to_fp16 = const()[name = tensor("op_2994_to_fp16"), val = tensor(0x1p-1)]; tensor var_2995_cast_fp16 = mul(x = linear_119_cast_fp16, y = var_2994_to_fp16)[name = tensor("op_2995_cast_fp16")]; tensor input_713_cast_fp16 = add(x = input_701_cast_fp16, y = var_2995_cast_fp16)[name = tensor("input_713_cast_fp16")]; tensor key_27_axes_0 = const()[name = tensor("key_27_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_13_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167959104)))]; tensor encoder_layers_13_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_13_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167960192)))]; tensor key_27_cast_fp16 = layer_norm(axes = key_27_axes_0, beta = encoder_layers_13_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_13_norm_self_att_weight_to_fp16, x = input_713_cast_fp16)[name = tensor("key_27_cast_fp16")]; tensor input_715_interleave_0 = const()[name = tensor("input_715_interleave_0"), val = tensor(false)]; tensor input_715_cast_fp16 = concat(axis = var_64, interleave = input_715_interleave_0, values = (cache_53_cast_fp16, key_27_cast_fp16))[name = tensor("input_715_cast_fp16")]; tensor var_3017_begin_0 = const()[name = tensor("op_3017_begin_0"), val = tensor([0, 1, 0])]; tensor var_3017_end_0 = const()[name = tensor("op_3017_end_0"), val = tensor([1, 70, 512])]; tensor var_3017_end_mask_0 = const()[name = tensor("op_3017_end_mask_0"), val = tensor([true, true, true])]; tensor var_3017_cast_fp16 = slice_by_index(begin = var_3017_begin_0, end = var_3017_end_0, end_mask = var_3017_end_mask_0, x = cache_53_cast_fp16)[name = tensor("op_3017_cast_fp16")]; tensor var_3020_begin_0 = const()[name = tensor("op_3020_begin_0"), val = tensor([0, 0, 0])]; tensor var_3020_end_0 = const()[name = tensor("op_3020_end_0"), val = tensor([1, 1, 512])]; tensor var_3020_end_mask_0 = const()[name = tensor("op_3020_end_mask_0"), val = tensor([true, false, true])]; tensor var_3020_cast_fp16 = slice_by_index(begin = var_3020_begin_0, end = var_3020_end_0, end_mask = var_3020_end_mask_0, x = key_27_cast_fp16)[name = tensor("op_3020_cast_fp16")]; tensor var_3023_interleave_0 = const()[name = tensor("op_3023_interleave_0"), val = tensor(false)]; tensor var_3023_cast_fp16 = concat(axis = var_64, interleave = var_3023_interleave_0, values = (var_3017_cast_fp16, var_3020_cast_fp16))[name = tensor("op_3023_cast_fp16")]; tensor encoder_layers_13_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167961280)))]; tensor linear_120_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_13_self_attn_linear_q_weight_to_fp16, x = key_27_cast_fp16)[name = tensor("linear_120_cast_fp16")]; tensor var_3027 = const()[name = tensor("op_3027"), val = tensor([1, -1, 8, 64])]; tensor q_79_cast_fp16 = reshape(shape = var_3027, x = linear_120_cast_fp16)[name = tensor("q_79_cast_fp16")]; tensor encoder_layers_13_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(168485632)))]; tensor linear_121_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_13_self_attn_linear_k_weight_to_fp16, x = input_715_cast_fp16)[name = tensor("linear_121_cast_fp16")]; tensor var_3031 = const()[name = tensor("op_3031"), val = tensor([1, -1, 8, 64])]; tensor k_53_cast_fp16 = reshape(shape = var_3031, x = linear_121_cast_fp16)[name = tensor("k_53_cast_fp16")]; tensor encoder_layers_13_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169009984)))]; tensor linear_122_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_13_self_attn_linear_v_weight_to_fp16, x = input_715_cast_fp16)[name = tensor("linear_122_cast_fp16")]; tensor var_3035 = const()[name = tensor("op_3035"), val = tensor([1, -1, 8, 64])]; tensor v_27_cast_fp16 = reshape(shape = var_3035, x = linear_122_cast_fp16)[name = tensor("v_27_cast_fp16")]; tensor value_29_perm_0 = const()[name = tensor("value_29_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_13_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169534336)))]; tensor var_3047_cast_fp16 = add(x = q_79_cast_fp16, y = encoder_layers_13_self_attn_pos_bias_u_to_fp16)[name = tensor("op_3047_cast_fp16")]; tensor encoder_layers_13_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169535424)))]; tensor var_3049_cast_fp16 = add(x = q_79_cast_fp16, y = encoder_layers_13_self_attn_pos_bias_v_to_fp16)[name = tensor("op_3049_cast_fp16")]; tensor q_with_bias_v_27_perm_0 = const()[name = tensor("q_with_bias_v_27_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_345_transpose_x_0 = const()[name = tensor("x_345_transpose_x_0"), val = tensor(false)]; tensor x_345_transpose_y_0 = const()[name = tensor("x_345_transpose_y_0"), val = tensor(false)]; tensor var_3051_to_fp16 = const()[name = tensor("op_3051_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169536512)))]; tensor q_with_bias_v_27_cast_fp16 = transpose(perm = q_with_bias_v_27_perm_0, x = var_3049_cast_fp16)[name = tensor("transpose_120")]; tensor x_345_cast_fp16 = matmul(transpose_x = x_345_transpose_x_0, transpose_y = x_345_transpose_y_0, x = q_with_bias_v_27_cast_fp16, y = var_3051_to_fp16)[name = tensor("x_345_cast_fp16")]; tensor x_347_pad_0 = const()[name = tensor("x_347_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_347_mode_0 = const()[name = tensor("x_347_mode_0"), val = tensor("constant")]; tensor const_192_to_fp16 = const()[name = tensor("const_192_to_fp16"), val = tensor(0x0p+0)]; tensor x_347_cast_fp16 = pad(constant_val = const_192_to_fp16, mode = x_347_mode_0, pad = x_347_pad_0, x = x_345_cast_fp16)[name = tensor("x_347_cast_fp16")]; tensor var_3059 = const()[name = tensor("op_3059"), val = tensor([1, 8, -1, 3])]; tensor x_349_cast_fp16 = reshape(shape = var_3059, x = x_347_cast_fp16)[name = tensor("x_349_cast_fp16")]; tensor var_3063_begin_0 = const()[name = tensor("op_3063_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_3063_end_0 = const()[name = tensor("op_3063_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_3063_end_mask_0 = const()[name = tensor("op_3063_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_3063_cast_fp16 = slice_by_index(begin = var_3063_begin_0, end = var_3063_end_0, end_mask = var_3063_end_mask_0, x = x_349_cast_fp16)[name = tensor("op_3063_cast_fp16")]; tensor var_3064 = const()[name = tensor("op_3064"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_53_cast_fp16 = reshape(shape = var_3064, x = var_3063_cast_fp16)[name = tensor("matrix_bd_53_cast_fp16")]; tensor matrix_ac_27_transpose_x_0 = const()[name = tensor("matrix_ac_27_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_27_transpose_y_0 = const()[name = tensor("matrix_ac_27_transpose_y_0"), val = tensor(false)]; tensor transpose_77_perm_0 = const()[name = tensor("transpose_77_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_78_perm_0 = const()[name = tensor("transpose_78_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_78 = transpose(perm = transpose_78_perm_0, x = k_53_cast_fp16)[name = tensor("transpose_118")]; tensor transpose_77 = transpose(perm = transpose_77_perm_0, x = var_3047_cast_fp16)[name = tensor("transpose_119")]; tensor matrix_ac_27_cast_fp16 = matmul(transpose_x = matrix_ac_27_transpose_x_0, transpose_y = matrix_ac_27_transpose_y_0, x = transpose_77, y = transpose_78)[name = tensor("matrix_ac_27_cast_fp16")]; tensor matrix_bd_55_begin_0 = const()[name = tensor("matrix_bd_55_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_55_end_0 = const()[name = tensor("matrix_bd_55_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_55_end_mask_0 = const()[name = tensor("matrix_bd_55_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_55_cast_fp16 = slice_by_index(begin = matrix_bd_55_begin_0, end = matrix_bd_55_end_0, end_mask = matrix_bd_55_end_mask_0, x = matrix_bd_53_cast_fp16)[name = tensor("matrix_bd_55_cast_fp16")]; tensor var_3073_cast_fp16 = add(x = matrix_ac_27_cast_fp16, y = matrix_bd_55_cast_fp16)[name = tensor("op_3073_cast_fp16")]; tensor _inversed_scores_53_y_0_to_fp16 = const()[name = tensor("_inversed_scores_53_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_53_cast_fp16 = mul(x = var_3073_cast_fp16, y = _inversed_scores_53_y_0_to_fp16)[name = tensor("_inversed_scores_53_cast_fp16")]; tensor scores_55_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_53_cast_fp16, cond = mask_3)[name = tensor("scores_55_cast_fp16")]; tensor var_3079_cast_fp16 = softmax(axis = var_62, x = scores_55_cast_fp16)[name = tensor("op_3079_cast_fp16")]; tensor input_717_cast_fp16 = select(a = var_40_to_fp16, b = var_3079_cast_fp16, cond = mask_3)[name = tensor("input_717_cast_fp16")]; tensor x_351_transpose_x_0 = const()[name = tensor("x_351_transpose_x_0"), val = tensor(false)]; tensor x_351_transpose_y_0 = const()[name = tensor("x_351_transpose_y_0"), val = tensor(false)]; tensor value_29_cast_fp16 = transpose(perm = value_29_perm_0, x = v_27_cast_fp16)[name = tensor("transpose_121")]; tensor x_351_cast_fp16 = matmul(transpose_x = x_351_transpose_x_0, transpose_y = x_351_transpose_y_0, x = input_717_cast_fp16, y = value_29_cast_fp16)[name = tensor("x_351_cast_fp16")]; tensor var_3083_perm_0 = const()[name = tensor("op_3083_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3084 = const()[name = tensor("op_3084"), val = tensor([1, -1, 512])]; tensor var_3083_cast_fp16 = transpose(perm = var_3083_perm_0, x = x_351_cast_fp16)[name = tensor("transpose_117")]; tensor input_719_cast_fp16 = reshape(shape = var_3084, x = var_3083_cast_fp16)[name = tensor("input_719_cast_fp16")]; tensor encoder_layers_13_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_13_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169685056)))]; tensor linear_124_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_13_self_attn_linear_out_weight_to_fp16, x = input_719_cast_fp16)[name = tensor("linear_124_cast_fp16")]; tensor input_723_cast_fp16 = add(x = input_713_cast_fp16, y = linear_124_cast_fp16)[name = tensor("input_723_cast_fp16")]; tensor x_355_axes_0 = const()[name = tensor("x_355_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_13_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(170209408)))]; tensor encoder_layers_13_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_13_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(170210496)))]; tensor x_355_cast_fp16 = layer_norm(axes = x_355_axes_0, beta = encoder_layers_13_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_13_norm_conv_weight_to_fp16, x = input_723_cast_fp16)[name = tensor("x_355_cast_fp16")]; tensor input_725_perm_0 = const()[name = tensor("input_725_perm_0"), val = tensor([0, 2, 1])]; tensor input_727_pad_type_0 = const()[name = tensor("input_727_pad_type_0"), val = tensor("valid")]; tensor input_727_strides_0 = const()[name = tensor("input_727_strides_0"), val = tensor([1])]; tensor input_727_pad_0 = const()[name = tensor("input_727_pad_0"), val = tensor([0, 0])]; tensor input_727_dilations_0 = const()[name = tensor("input_727_dilations_0"), val = tensor([1])]; tensor input_727_groups_0 = const()[name = tensor("input_727_groups_0"), val = tensor(1)]; tensor encoder_layers_13_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_13_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(170211584)))]; tensor input_725_cast_fp16 = transpose(perm = input_725_perm_0, x = x_355_cast_fp16)[name = tensor("transpose_116")]; tensor input_727_cast_fp16 = conv(dilations = input_727_dilations_0, groups = input_727_groups_0, pad = input_727_pad_0, pad_type = input_727_pad_type_0, strides = input_727_strides_0, weight = encoder_layers_13_conv_pointwise_conv1_weight_to_fp16, x = input_725_cast_fp16)[name = tensor("input_727_cast_fp16")]; tensor x_357_split_num_splits_0 = const()[name = tensor("x_357_split_num_splits_0"), val = tensor(2)]; tensor x_357_split_axis_0 = const()[name = tensor("x_357_split_axis_0"), val = tensor(1)]; tensor x_357_split_cast_fp16_0, tensor x_357_split_cast_fp16_1 = split(axis = x_357_split_axis_0, num_splits = x_357_split_num_splits_0, x = input_727_cast_fp16)[name = tensor("x_357_split_cast_fp16")]; tensor x_357_split_1_sigmoid_cast_fp16 = sigmoid(x = x_357_split_cast_fp16_1)[name = tensor("x_357_split_1_sigmoid_cast_fp16")]; tensor x_357_cast_fp16 = mul(x = x_357_split_cast_fp16_0, y = x_357_split_1_sigmoid_cast_fp16)[name = tensor("x_357_cast_fp16")]; tensor input_729_cast_fp16 = select(a = var_40_to_fp16, b = x_357_cast_fp16, cond = var_418)[name = tensor("input_729_cast_fp16")]; tensor new_x_55_interleave_0 = const()[name = tensor("new_x_55_interleave_0"), val = tensor(false)]; tensor new_x_55_cast_fp16 = concat(axis = var_62, interleave = new_x_55_interleave_0, values = (cache_55_cast_fp16, input_729_cast_fp16))[name = tensor("new_x_55_cast_fp16")]; tensor next_cache_27_begin_0 = const()[name = tensor("next_cache_27_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_27_end_0 = const()[name = tensor("next_cache_27_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_27_end_mask_0 = const()[name = tensor("next_cache_27_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_27_cast_fp16 = slice_by_index(begin = next_cache_27_begin_0, end = next_cache_27_end_0, end_mask = next_cache_27_end_mask_0, x = new_x_55_cast_fp16)[name = tensor("next_cache_27_cast_fp16")]; tensor var_3125_begin_0 = const()[name = tensor("op_3125_begin_0"), val = tensor([0, 0, 1])]; tensor var_3125_end_0 = const()[name = tensor("op_3125_end_0"), val = tensor([1, 512, 9])]; tensor var_3125_end_mask_0 = const()[name = tensor("op_3125_end_mask_0"), val = tensor([true, true, true])]; tensor var_3125_cast_fp16 = slice_by_index(begin = var_3125_begin_0, end = var_3125_end_0, end_mask = var_3125_end_mask_0, x = next_cache_27_cast_fp16)[name = tensor("op_3125_cast_fp16")]; tensor x_359_pad_type_0 = const()[name = tensor("x_359_pad_type_0"), val = tensor("valid")]; tensor x_359_groups_0 = const()[name = tensor("x_359_groups_0"), val = tensor(512)]; tensor x_359_strides_0 = const()[name = tensor("x_359_strides_0"), val = tensor([1])]; tensor x_359_pad_0 = const()[name = tensor("x_359_pad_0"), val = tensor([0, 0])]; tensor x_359_dilations_0 = const()[name = tensor("x_359_dilations_0"), val = tensor([1])]; tensor encoder_layers_13_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_13_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(171260224)))]; tensor x_359_cast_fp16 = conv(dilations = x_359_dilations_0, groups = x_359_groups_0, pad = x_359_pad_0, pad_type = x_359_pad_type_0, strides = x_359_strides_0, weight = encoder_layers_13_conv_depthwise_conv_weight_to_fp16, x = new_x_55_cast_fp16)[name = tensor("x_359_cast_fp16")]; tensor input_731_perm_0 = const()[name = tensor("input_731_perm_0"), val = tensor([0, 2, 1])]; tensor x_361_axes_0 = const()[name = tensor("x_361_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_13_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(171269504)))]; tensor encoder_layers_13_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_13_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(171270592)))]; tensor input_731_cast_fp16 = transpose(perm = input_731_perm_0, x = x_359_cast_fp16)[name = tensor("transpose_115")]; tensor x_361_cast_fp16 = layer_norm(axes = x_361_axes_0, beta = encoder_layers_13_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_13_conv_batch_norm_weight_to_fp16, x = input_731_cast_fp16)[name = tensor("x_361_cast_fp16")]; tensor input_733_perm_0 = const()[name = tensor("input_733_perm_0"), val = tensor([0, 2, 1])]; tensor input_733_cast_fp16 = transpose(perm = input_733_perm_0, x = x_361_cast_fp16)[name = tensor("transpose_114")]; tensor input_735_cast_fp16 = silu(x = input_733_cast_fp16)[name = tensor("input_735_cast_fp16")]; tensor x_363_pad_type_0 = const()[name = tensor("x_363_pad_type_0"), val = tensor("valid")]; tensor x_363_strides_0 = const()[name = tensor("x_363_strides_0"), val = tensor([1])]; tensor x_363_pad_0 = const()[name = tensor("x_363_pad_0"), val = tensor([0, 0])]; tensor x_363_dilations_0 = const()[name = tensor("x_363_dilations_0"), val = tensor([1])]; tensor x_363_groups_0 = const()[name = tensor("x_363_groups_0"), val = tensor(1)]; tensor encoder_layers_13_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_13_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(171271680)))]; tensor x_363_cast_fp16 = conv(dilations = x_363_dilations_0, groups = x_363_groups_0, pad = x_363_pad_0, pad_type = x_363_pad_type_0, strides = x_363_strides_0, weight = encoder_layers_13_conv_pointwise_conv2_weight_to_fp16, x = input_735_cast_fp16)[name = tensor("x_363_cast_fp16")]; tensor input_737_perm_0 = const()[name = tensor("input_737_perm_0"), val = tensor([0, 2, 1])]; tensor input_737_cast_fp16 = transpose(perm = input_737_perm_0, x = x_363_cast_fp16)[name = tensor("transpose_113")]; tensor input_739_cast_fp16 = add(x = input_723_cast_fp16, y = input_737_cast_fp16)[name = tensor("input_739_cast_fp16")]; tensor input_741_axes_0 = const()[name = tensor("input_741_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_13_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(171796032)))]; tensor encoder_layers_13_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_13_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(171797120)))]; tensor input_741_cast_fp16 = layer_norm(axes = input_741_axes_0, beta = encoder_layers_13_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_13_norm_feed_forward2_weight_to_fp16, x = input_739_cast_fp16)[name = tensor("input_741_cast_fp16")]; tensor encoder_layers_13_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_13_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(171798208)))]; tensor linear_125_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_13_feed_forward2_linear1_weight_to_fp16, x = input_741_cast_fp16)[name = tensor("linear_125_cast_fp16")]; tensor input_745_cast_fp16 = silu(x = linear_125_cast_fp16)[name = tensor("input_745_cast_fp16")]; tensor encoder_layers_13_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_13_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(173895424)))]; tensor linear_126_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_13_feed_forward2_linear2_weight_to_fp16, x = input_745_cast_fp16)[name = tensor("linear_126_cast_fp16")]; tensor var_3166_to_fp16 = const()[name = tensor("op_3166_to_fp16"), val = tensor(0x1p-1)]; tensor var_3167_cast_fp16 = mul(x = linear_126_cast_fp16, y = var_3166_to_fp16)[name = tensor("op_3167_cast_fp16")]; tensor input_751_cast_fp16 = add(x = input_739_cast_fp16, y = var_3167_cast_fp16)[name = tensor("input_751_cast_fp16")]; tensor input_753_axes_0 = const()[name = tensor("input_753_axes_0"), val = tensor([-1])]; tensor encoder_layers_13_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_13_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(175992640)))]; tensor encoder_layers_13_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_13_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(175993728)))]; tensor input_753_cast_fp16 = layer_norm(axes = input_753_axes_0, beta = encoder_layers_13_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_13_norm_out_weight_to_fp16, x = input_751_cast_fp16)[name = tensor("input_753_cast_fp16")]; tensor cache_57_begin_0 = const()[name = tensor("cache_57_begin_0"), val = tensor([14, 0, 0, 0])]; tensor cache_57_end_0 = const()[name = tensor("cache_57_end_0"), val = tensor([15, 1, 70, 512])]; tensor cache_57_end_mask_0 = const()[name = tensor("cache_57_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_57_squeeze_mask_0 = const()[name = tensor("cache_57_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_57_cast_fp16 = slice_by_index(begin = cache_57_begin_0, end = cache_57_end_0, end_mask = cache_57_end_mask_0, squeeze_mask = cache_57_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_57_cast_fp16")]; tensor cache_59_begin_0 = const()[name = tensor("cache_59_begin_0"), val = tensor([14, 0, 0, 0])]; tensor cache_59_end_0 = const()[name = tensor("cache_59_end_0"), val = tensor([15, 1, 512, 8])]; tensor cache_59_end_mask_0 = const()[name = tensor("cache_59_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_59_squeeze_mask_0 = const()[name = tensor("cache_59_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_59_cast_fp16 = slice_by_index(begin = cache_59_begin_0, end = cache_59_end_0, end_mask = cache_59_end_mask_0, squeeze_mask = cache_59_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_59_cast_fp16")]; tensor input_755_axes_0 = const()[name = tensor("input_755_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_14_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(175994816)))]; tensor encoder_layers_14_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_14_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(175995904)))]; tensor input_755_cast_fp16 = layer_norm(axes = input_755_axes_0, beta = encoder_layers_14_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_14_norm_feed_forward1_weight_to_fp16, x = input_753_cast_fp16)[name = tensor("input_755_cast_fp16")]; tensor encoder_layers_14_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_14_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(175996992)))]; tensor linear_127_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_14_feed_forward1_linear1_weight_to_fp16, x = input_755_cast_fp16)[name = tensor("linear_127_cast_fp16")]; tensor input_759_cast_fp16 = silu(x = linear_127_cast_fp16)[name = tensor("input_759_cast_fp16")]; tensor encoder_layers_14_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_14_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178094208)))]; tensor linear_128_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_14_feed_forward1_linear2_weight_to_fp16, x = input_759_cast_fp16)[name = tensor("linear_128_cast_fp16")]; tensor var_3201_to_fp16 = const()[name = tensor("op_3201_to_fp16"), val = tensor(0x1p-1)]; tensor var_3202_cast_fp16 = mul(x = linear_128_cast_fp16, y = var_3201_to_fp16)[name = tensor("op_3202_cast_fp16")]; tensor input_765_cast_fp16 = add(x = input_753_cast_fp16, y = var_3202_cast_fp16)[name = tensor("input_765_cast_fp16")]; tensor key_29_axes_0 = const()[name = tensor("key_29_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_14_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180191424)))]; tensor encoder_layers_14_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_14_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180192512)))]; tensor key_29_cast_fp16 = layer_norm(axes = key_29_axes_0, beta = encoder_layers_14_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_14_norm_self_att_weight_to_fp16, x = input_765_cast_fp16)[name = tensor("key_29_cast_fp16")]; tensor input_767_interleave_0 = const()[name = tensor("input_767_interleave_0"), val = tensor(false)]; tensor input_767_cast_fp16 = concat(axis = var_64, interleave = input_767_interleave_0, values = (cache_57_cast_fp16, key_29_cast_fp16))[name = tensor("input_767_cast_fp16")]; tensor var_3224_begin_0 = const()[name = tensor("op_3224_begin_0"), val = tensor([0, 1, 0])]; tensor var_3224_end_0 = const()[name = tensor("op_3224_end_0"), val = tensor([1, 70, 512])]; tensor var_3224_end_mask_0 = const()[name = tensor("op_3224_end_mask_0"), val = tensor([true, true, true])]; tensor var_3224_cast_fp16 = slice_by_index(begin = var_3224_begin_0, end = var_3224_end_0, end_mask = var_3224_end_mask_0, x = cache_57_cast_fp16)[name = tensor("op_3224_cast_fp16")]; tensor var_3227_begin_0 = const()[name = tensor("op_3227_begin_0"), val = tensor([0, 0, 0])]; tensor var_3227_end_0 = const()[name = tensor("op_3227_end_0"), val = tensor([1, 1, 512])]; tensor var_3227_end_mask_0 = const()[name = tensor("op_3227_end_mask_0"), val = tensor([true, false, true])]; tensor var_3227_cast_fp16 = slice_by_index(begin = var_3227_begin_0, end = var_3227_end_0, end_mask = var_3227_end_mask_0, x = key_29_cast_fp16)[name = tensor("op_3227_cast_fp16")]; tensor var_3230_interleave_0 = const()[name = tensor("op_3230_interleave_0"), val = tensor(false)]; tensor var_3230_cast_fp16 = concat(axis = var_64, interleave = var_3230_interleave_0, values = (var_3224_cast_fp16, var_3227_cast_fp16))[name = tensor("op_3230_cast_fp16")]; tensor encoder_layers_14_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180193600)))]; tensor linear_129_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_14_self_attn_linear_q_weight_to_fp16, x = key_29_cast_fp16)[name = tensor("linear_129_cast_fp16")]; tensor var_3234 = const()[name = tensor("op_3234"), val = tensor([1, -1, 8, 64])]; tensor q_85_cast_fp16 = reshape(shape = var_3234, x = linear_129_cast_fp16)[name = tensor("q_85_cast_fp16")]; tensor encoder_layers_14_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180717952)))]; tensor linear_130_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_14_self_attn_linear_k_weight_to_fp16, x = input_767_cast_fp16)[name = tensor("linear_130_cast_fp16")]; tensor var_3238 = const()[name = tensor("op_3238"), val = tensor([1, -1, 8, 64])]; tensor k_57_cast_fp16 = reshape(shape = var_3238, x = linear_130_cast_fp16)[name = tensor("k_57_cast_fp16")]; tensor encoder_layers_14_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181242304)))]; tensor linear_131_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_14_self_attn_linear_v_weight_to_fp16, x = input_767_cast_fp16)[name = tensor("linear_131_cast_fp16")]; tensor var_3242 = const()[name = tensor("op_3242"), val = tensor([1, -1, 8, 64])]; tensor v_29_cast_fp16 = reshape(shape = var_3242, x = linear_131_cast_fp16)[name = tensor("v_29_cast_fp16")]; tensor value_31_perm_0 = const()[name = tensor("value_31_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_14_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181766656)))]; tensor var_3254_cast_fp16 = add(x = q_85_cast_fp16, y = encoder_layers_14_self_attn_pos_bias_u_to_fp16)[name = tensor("op_3254_cast_fp16")]; tensor encoder_layers_14_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181767744)))]; tensor var_3256_cast_fp16 = add(x = q_85_cast_fp16, y = encoder_layers_14_self_attn_pos_bias_v_to_fp16)[name = tensor("op_3256_cast_fp16")]; tensor q_with_bias_v_29_perm_0 = const()[name = tensor("q_with_bias_v_29_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_371_transpose_x_0 = const()[name = tensor("x_371_transpose_x_0"), val = tensor(false)]; tensor x_371_transpose_y_0 = const()[name = tensor("x_371_transpose_y_0"), val = tensor(false)]; tensor var_3258_to_fp16 = const()[name = tensor("op_3258_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181768832)))]; tensor q_with_bias_v_29_cast_fp16 = transpose(perm = q_with_bias_v_29_perm_0, x = var_3256_cast_fp16)[name = tensor("transpose_111")]; tensor x_371_cast_fp16 = matmul(transpose_x = x_371_transpose_x_0, transpose_y = x_371_transpose_y_0, x = q_with_bias_v_29_cast_fp16, y = var_3258_to_fp16)[name = tensor("x_371_cast_fp16")]; tensor x_373_pad_0 = const()[name = tensor("x_373_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_373_mode_0 = const()[name = tensor("x_373_mode_0"), val = tensor("constant")]; tensor const_205_to_fp16 = const()[name = tensor("const_205_to_fp16"), val = tensor(0x0p+0)]; tensor x_373_cast_fp16 = pad(constant_val = const_205_to_fp16, mode = x_373_mode_0, pad = x_373_pad_0, x = x_371_cast_fp16)[name = tensor("x_373_cast_fp16")]; tensor var_3266 = const()[name = tensor("op_3266"), val = tensor([1, 8, -1, 3])]; tensor x_375_cast_fp16 = reshape(shape = var_3266, x = x_373_cast_fp16)[name = tensor("x_375_cast_fp16")]; tensor var_3270_begin_0 = const()[name = tensor("op_3270_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_3270_end_0 = const()[name = tensor("op_3270_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_3270_end_mask_0 = const()[name = tensor("op_3270_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_3270_cast_fp16 = slice_by_index(begin = var_3270_begin_0, end = var_3270_end_0, end_mask = var_3270_end_mask_0, x = x_375_cast_fp16)[name = tensor("op_3270_cast_fp16")]; tensor var_3271 = const()[name = tensor("op_3271"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_57_cast_fp16 = reshape(shape = var_3271, x = var_3270_cast_fp16)[name = tensor("matrix_bd_57_cast_fp16")]; tensor matrix_ac_29_transpose_x_0 = const()[name = tensor("matrix_ac_29_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_29_transpose_y_0 = const()[name = tensor("matrix_ac_29_transpose_y_0"), val = tensor(false)]; tensor transpose_79_perm_0 = const()[name = tensor("transpose_79_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_80_perm_0 = const()[name = tensor("transpose_80_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_80 = transpose(perm = transpose_80_perm_0, x = k_57_cast_fp16)[name = tensor("transpose_109")]; tensor transpose_79 = transpose(perm = transpose_79_perm_0, x = var_3254_cast_fp16)[name = tensor("transpose_110")]; tensor matrix_ac_29_cast_fp16 = matmul(transpose_x = matrix_ac_29_transpose_x_0, transpose_y = matrix_ac_29_transpose_y_0, x = transpose_79, y = transpose_80)[name = tensor("matrix_ac_29_cast_fp16")]; tensor matrix_bd_59_begin_0 = const()[name = tensor("matrix_bd_59_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_59_end_0 = const()[name = tensor("matrix_bd_59_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_59_end_mask_0 = const()[name = tensor("matrix_bd_59_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_59_cast_fp16 = slice_by_index(begin = matrix_bd_59_begin_0, end = matrix_bd_59_end_0, end_mask = matrix_bd_59_end_mask_0, x = matrix_bd_57_cast_fp16)[name = tensor("matrix_bd_59_cast_fp16")]; tensor var_3280_cast_fp16 = add(x = matrix_ac_29_cast_fp16, y = matrix_bd_59_cast_fp16)[name = tensor("op_3280_cast_fp16")]; tensor _inversed_scores_57_y_0_to_fp16 = const()[name = tensor("_inversed_scores_57_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_57_cast_fp16 = mul(x = var_3280_cast_fp16, y = _inversed_scores_57_y_0_to_fp16)[name = tensor("_inversed_scores_57_cast_fp16")]; tensor scores_59_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_57_cast_fp16, cond = mask_3)[name = tensor("scores_59_cast_fp16")]; tensor var_3286_cast_fp16 = softmax(axis = var_62, x = scores_59_cast_fp16)[name = tensor("op_3286_cast_fp16")]; tensor input_769_cast_fp16 = select(a = var_40_to_fp16, b = var_3286_cast_fp16, cond = mask_3)[name = tensor("input_769_cast_fp16")]; tensor x_377_transpose_x_0 = const()[name = tensor("x_377_transpose_x_0"), val = tensor(false)]; tensor x_377_transpose_y_0 = const()[name = tensor("x_377_transpose_y_0"), val = tensor(false)]; tensor value_31_cast_fp16 = transpose(perm = value_31_perm_0, x = v_29_cast_fp16)[name = tensor("transpose_112")]; tensor x_377_cast_fp16 = matmul(transpose_x = x_377_transpose_x_0, transpose_y = x_377_transpose_y_0, x = input_769_cast_fp16, y = value_31_cast_fp16)[name = tensor("x_377_cast_fp16")]; tensor var_3290_perm_0 = const()[name = tensor("op_3290_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3291 = const()[name = tensor("op_3291"), val = tensor([1, -1, 512])]; tensor var_3290_cast_fp16 = transpose(perm = var_3290_perm_0, x = x_377_cast_fp16)[name = tensor("transpose_108")]; tensor input_771_cast_fp16 = reshape(shape = var_3291, x = var_3290_cast_fp16)[name = tensor("input_771_cast_fp16")]; tensor encoder_layers_14_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_14_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181917376)))]; tensor linear_133_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_14_self_attn_linear_out_weight_to_fp16, x = input_771_cast_fp16)[name = tensor("linear_133_cast_fp16")]; tensor input_775_cast_fp16 = add(x = input_765_cast_fp16, y = linear_133_cast_fp16)[name = tensor("input_775_cast_fp16")]; tensor x_381_axes_0 = const()[name = tensor("x_381_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_14_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(182441728)))]; tensor encoder_layers_14_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_14_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(182442816)))]; tensor x_381_cast_fp16 = layer_norm(axes = x_381_axes_0, beta = encoder_layers_14_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_14_norm_conv_weight_to_fp16, x = input_775_cast_fp16)[name = tensor("x_381_cast_fp16")]; tensor input_777_perm_0 = const()[name = tensor("input_777_perm_0"), val = tensor([0, 2, 1])]; tensor input_779_pad_type_0 = const()[name = tensor("input_779_pad_type_0"), val = tensor("valid")]; tensor input_779_strides_0 = const()[name = tensor("input_779_strides_0"), val = tensor([1])]; tensor input_779_pad_0 = const()[name = tensor("input_779_pad_0"), val = tensor([0, 0])]; tensor input_779_dilations_0 = const()[name = tensor("input_779_dilations_0"), val = tensor([1])]; tensor input_779_groups_0 = const()[name = tensor("input_779_groups_0"), val = tensor(1)]; tensor encoder_layers_14_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_14_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(182443904)))]; tensor input_777_cast_fp16 = transpose(perm = input_777_perm_0, x = x_381_cast_fp16)[name = tensor("transpose_107")]; tensor input_779_cast_fp16 = conv(dilations = input_779_dilations_0, groups = input_779_groups_0, pad = input_779_pad_0, pad_type = input_779_pad_type_0, strides = input_779_strides_0, weight = encoder_layers_14_conv_pointwise_conv1_weight_to_fp16, x = input_777_cast_fp16)[name = tensor("input_779_cast_fp16")]; tensor x_383_split_num_splits_0 = const()[name = tensor("x_383_split_num_splits_0"), val = tensor(2)]; tensor x_383_split_axis_0 = const()[name = tensor("x_383_split_axis_0"), val = tensor(1)]; tensor x_383_split_cast_fp16_0, tensor x_383_split_cast_fp16_1 = split(axis = x_383_split_axis_0, num_splits = x_383_split_num_splits_0, x = input_779_cast_fp16)[name = tensor("x_383_split_cast_fp16")]; tensor x_383_split_1_sigmoid_cast_fp16 = sigmoid(x = x_383_split_cast_fp16_1)[name = tensor("x_383_split_1_sigmoid_cast_fp16")]; tensor x_383_cast_fp16 = mul(x = x_383_split_cast_fp16_0, y = x_383_split_1_sigmoid_cast_fp16)[name = tensor("x_383_cast_fp16")]; tensor input_781_cast_fp16 = select(a = var_40_to_fp16, b = x_383_cast_fp16, cond = var_418)[name = tensor("input_781_cast_fp16")]; tensor new_x_59_interleave_0 = const()[name = tensor("new_x_59_interleave_0"), val = tensor(false)]; tensor new_x_59_cast_fp16 = concat(axis = var_62, interleave = new_x_59_interleave_0, values = (cache_59_cast_fp16, input_781_cast_fp16))[name = tensor("new_x_59_cast_fp16")]; tensor next_cache_29_begin_0 = const()[name = tensor("next_cache_29_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_29_end_0 = const()[name = tensor("next_cache_29_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_29_end_mask_0 = const()[name = tensor("next_cache_29_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_29_cast_fp16 = slice_by_index(begin = next_cache_29_begin_0, end = next_cache_29_end_0, end_mask = next_cache_29_end_mask_0, x = new_x_59_cast_fp16)[name = tensor("next_cache_29_cast_fp16")]; tensor var_3332_begin_0 = const()[name = tensor("op_3332_begin_0"), val = tensor([0, 0, 1])]; tensor var_3332_end_0 = const()[name = tensor("op_3332_end_0"), val = tensor([1, 512, 9])]; tensor var_3332_end_mask_0 = const()[name = tensor("op_3332_end_mask_0"), val = tensor([true, true, true])]; tensor var_3332_cast_fp16 = slice_by_index(begin = var_3332_begin_0, end = var_3332_end_0, end_mask = var_3332_end_mask_0, x = next_cache_29_cast_fp16)[name = tensor("op_3332_cast_fp16")]; tensor x_385_pad_type_0 = const()[name = tensor("x_385_pad_type_0"), val = tensor("valid")]; tensor x_385_groups_0 = const()[name = tensor("x_385_groups_0"), val = tensor(512)]; tensor x_385_strides_0 = const()[name = tensor("x_385_strides_0"), val = tensor([1])]; tensor x_385_pad_0 = const()[name = tensor("x_385_pad_0"), val = tensor([0, 0])]; tensor x_385_dilations_0 = const()[name = tensor("x_385_dilations_0"), val = tensor([1])]; tensor encoder_layers_14_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_14_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183492544)))]; tensor x_385_cast_fp16 = conv(dilations = x_385_dilations_0, groups = x_385_groups_0, pad = x_385_pad_0, pad_type = x_385_pad_type_0, strides = x_385_strides_0, weight = encoder_layers_14_conv_depthwise_conv_weight_to_fp16, x = new_x_59_cast_fp16)[name = tensor("x_385_cast_fp16")]; tensor input_783_perm_0 = const()[name = tensor("input_783_perm_0"), val = tensor([0, 2, 1])]; tensor x_387_axes_0 = const()[name = tensor("x_387_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_14_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183501824)))]; tensor encoder_layers_14_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_14_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183502912)))]; tensor input_783_cast_fp16 = transpose(perm = input_783_perm_0, x = x_385_cast_fp16)[name = tensor("transpose_106")]; tensor x_387_cast_fp16 = layer_norm(axes = x_387_axes_0, beta = encoder_layers_14_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_14_conv_batch_norm_weight_to_fp16, x = input_783_cast_fp16)[name = tensor("x_387_cast_fp16")]; tensor input_785_perm_0 = const()[name = tensor("input_785_perm_0"), val = tensor([0, 2, 1])]; tensor input_785_cast_fp16 = transpose(perm = input_785_perm_0, x = x_387_cast_fp16)[name = tensor("transpose_105")]; tensor input_787_cast_fp16 = silu(x = input_785_cast_fp16)[name = tensor("input_787_cast_fp16")]; tensor x_389_pad_type_0 = const()[name = tensor("x_389_pad_type_0"), val = tensor("valid")]; tensor x_389_strides_0 = const()[name = tensor("x_389_strides_0"), val = tensor([1])]; tensor x_389_pad_0 = const()[name = tensor("x_389_pad_0"), val = tensor([0, 0])]; tensor x_389_dilations_0 = const()[name = tensor("x_389_dilations_0"), val = tensor([1])]; tensor x_389_groups_0 = const()[name = tensor("x_389_groups_0"), val = tensor(1)]; tensor encoder_layers_14_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_14_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183504000)))]; tensor x_389_cast_fp16 = conv(dilations = x_389_dilations_0, groups = x_389_groups_0, pad = x_389_pad_0, pad_type = x_389_pad_type_0, strides = x_389_strides_0, weight = encoder_layers_14_conv_pointwise_conv2_weight_to_fp16, x = input_787_cast_fp16)[name = tensor("x_389_cast_fp16")]; tensor input_789_perm_0 = const()[name = tensor("input_789_perm_0"), val = tensor([0, 2, 1])]; tensor input_789_cast_fp16 = transpose(perm = input_789_perm_0, x = x_389_cast_fp16)[name = tensor("transpose_104")]; tensor input_791_cast_fp16 = add(x = input_775_cast_fp16, y = input_789_cast_fp16)[name = tensor("input_791_cast_fp16")]; tensor input_793_axes_0 = const()[name = tensor("input_793_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_14_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(184028352)))]; tensor encoder_layers_14_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_14_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(184029440)))]; tensor input_793_cast_fp16 = layer_norm(axes = input_793_axes_0, beta = encoder_layers_14_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_14_norm_feed_forward2_weight_to_fp16, x = input_791_cast_fp16)[name = tensor("input_793_cast_fp16")]; tensor encoder_layers_14_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_14_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(184030528)))]; tensor linear_134_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_14_feed_forward2_linear1_weight_to_fp16, x = input_793_cast_fp16)[name = tensor("linear_134_cast_fp16")]; tensor input_797_cast_fp16 = silu(x = linear_134_cast_fp16)[name = tensor("input_797_cast_fp16")]; tensor encoder_layers_14_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_14_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186127744)))]; tensor linear_135_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_14_feed_forward2_linear2_weight_to_fp16, x = input_797_cast_fp16)[name = tensor("linear_135_cast_fp16")]; tensor var_3373_to_fp16 = const()[name = tensor("op_3373_to_fp16"), val = tensor(0x1p-1)]; tensor var_3374_cast_fp16 = mul(x = linear_135_cast_fp16, y = var_3373_to_fp16)[name = tensor("op_3374_cast_fp16")]; tensor input_803_cast_fp16 = add(x = input_791_cast_fp16, y = var_3374_cast_fp16)[name = tensor("input_803_cast_fp16")]; tensor input_805_axes_0 = const()[name = tensor("input_805_axes_0"), val = tensor([-1])]; tensor encoder_layers_14_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_14_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(188224960)))]; tensor encoder_layers_14_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_14_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(188226048)))]; tensor input_805_cast_fp16 = layer_norm(axes = input_805_axes_0, beta = encoder_layers_14_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_14_norm_out_weight_to_fp16, x = input_803_cast_fp16)[name = tensor("input_805_cast_fp16")]; tensor cache_61_begin_0 = const()[name = tensor("cache_61_begin_0"), val = tensor([15, 0, 0, 0])]; tensor cache_61_end_0 = const()[name = tensor("cache_61_end_0"), val = tensor([16, 1, 70, 512])]; tensor cache_61_end_mask_0 = const()[name = tensor("cache_61_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_61_squeeze_mask_0 = const()[name = tensor("cache_61_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_61_cast_fp16 = slice_by_index(begin = cache_61_begin_0, end = cache_61_end_0, end_mask = cache_61_end_mask_0, squeeze_mask = cache_61_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_61_cast_fp16")]; tensor cache_63_begin_0 = const()[name = tensor("cache_63_begin_0"), val = tensor([15, 0, 0, 0])]; tensor cache_63_end_0 = const()[name = tensor("cache_63_end_0"), val = tensor([16, 1, 512, 8])]; tensor cache_63_end_mask_0 = const()[name = tensor("cache_63_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_63_squeeze_mask_0 = const()[name = tensor("cache_63_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_63_cast_fp16 = slice_by_index(begin = cache_63_begin_0, end = cache_63_end_0, end_mask = cache_63_end_mask_0, squeeze_mask = cache_63_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_63_cast_fp16")]; tensor input_807_axes_0 = const()[name = tensor("input_807_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_15_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(188227136)))]; tensor encoder_layers_15_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_15_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(188228224)))]; tensor input_807_cast_fp16 = layer_norm(axes = input_807_axes_0, beta = encoder_layers_15_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_15_norm_feed_forward1_weight_to_fp16, x = input_805_cast_fp16)[name = tensor("input_807_cast_fp16")]; tensor encoder_layers_15_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_15_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(188229312)))]; tensor linear_136_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_15_feed_forward1_linear1_weight_to_fp16, x = input_807_cast_fp16)[name = tensor("linear_136_cast_fp16")]; tensor input_811_cast_fp16 = silu(x = linear_136_cast_fp16)[name = tensor("input_811_cast_fp16")]; tensor encoder_layers_15_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_15_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190326528)))]; tensor linear_137_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_15_feed_forward1_linear2_weight_to_fp16, x = input_811_cast_fp16)[name = tensor("linear_137_cast_fp16")]; tensor var_3408_to_fp16 = const()[name = tensor("op_3408_to_fp16"), val = tensor(0x1p-1)]; tensor var_3409_cast_fp16 = mul(x = linear_137_cast_fp16, y = var_3408_to_fp16)[name = tensor("op_3409_cast_fp16")]; tensor input_817_cast_fp16 = add(x = input_805_cast_fp16, y = var_3409_cast_fp16)[name = tensor("input_817_cast_fp16")]; tensor key_31_axes_0 = const()[name = tensor("key_31_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_15_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192423744)))]; tensor encoder_layers_15_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_15_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192424832)))]; tensor key_31_cast_fp16 = layer_norm(axes = key_31_axes_0, beta = encoder_layers_15_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_15_norm_self_att_weight_to_fp16, x = input_817_cast_fp16)[name = tensor("key_31_cast_fp16")]; tensor input_819_interleave_0 = const()[name = tensor("input_819_interleave_0"), val = tensor(false)]; tensor input_819_cast_fp16 = concat(axis = var_64, interleave = input_819_interleave_0, values = (cache_61_cast_fp16, key_31_cast_fp16))[name = tensor("input_819_cast_fp16")]; tensor var_3431_begin_0 = const()[name = tensor("op_3431_begin_0"), val = tensor([0, 1, 0])]; tensor var_3431_end_0 = const()[name = tensor("op_3431_end_0"), val = tensor([1, 70, 512])]; tensor var_3431_end_mask_0 = const()[name = tensor("op_3431_end_mask_0"), val = tensor([true, true, true])]; tensor var_3431_cast_fp16 = slice_by_index(begin = var_3431_begin_0, end = var_3431_end_0, end_mask = var_3431_end_mask_0, x = cache_61_cast_fp16)[name = tensor("op_3431_cast_fp16")]; tensor var_3434_begin_0 = const()[name = tensor("op_3434_begin_0"), val = tensor([0, 0, 0])]; tensor var_3434_end_0 = const()[name = tensor("op_3434_end_0"), val = tensor([1, 1, 512])]; tensor var_3434_end_mask_0 = const()[name = tensor("op_3434_end_mask_0"), val = tensor([true, false, true])]; tensor var_3434_cast_fp16 = slice_by_index(begin = var_3434_begin_0, end = var_3434_end_0, end_mask = var_3434_end_mask_0, x = key_31_cast_fp16)[name = tensor("op_3434_cast_fp16")]; tensor var_3437_interleave_0 = const()[name = tensor("op_3437_interleave_0"), val = tensor(false)]; tensor var_3437_cast_fp16 = concat(axis = var_64, interleave = var_3437_interleave_0, values = (var_3431_cast_fp16, var_3434_cast_fp16))[name = tensor("op_3437_cast_fp16")]; tensor encoder_layers_15_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192425920)))]; tensor linear_138_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_15_self_attn_linear_q_weight_to_fp16, x = key_31_cast_fp16)[name = tensor("linear_138_cast_fp16")]; tensor var_3441 = const()[name = tensor("op_3441"), val = tensor([1, -1, 8, 64])]; tensor q_91_cast_fp16 = reshape(shape = var_3441, x = linear_138_cast_fp16)[name = tensor("q_91_cast_fp16")]; tensor encoder_layers_15_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192950272)))]; tensor linear_139_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_15_self_attn_linear_k_weight_to_fp16, x = input_819_cast_fp16)[name = tensor("linear_139_cast_fp16")]; tensor var_3445 = const()[name = tensor("op_3445"), val = tensor([1, -1, 8, 64])]; tensor k_61_cast_fp16 = reshape(shape = var_3445, x = linear_139_cast_fp16)[name = tensor("k_61_cast_fp16")]; tensor encoder_layers_15_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(193474624)))]; tensor linear_140_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_15_self_attn_linear_v_weight_to_fp16, x = input_819_cast_fp16)[name = tensor("linear_140_cast_fp16")]; tensor var_3449 = const()[name = tensor("op_3449"), val = tensor([1, -1, 8, 64])]; tensor v_31_cast_fp16 = reshape(shape = var_3449, x = linear_140_cast_fp16)[name = tensor("v_31_cast_fp16")]; tensor value_33_perm_0 = const()[name = tensor("value_33_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_15_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(193998976)))]; tensor var_3461_cast_fp16 = add(x = q_91_cast_fp16, y = encoder_layers_15_self_attn_pos_bias_u_to_fp16)[name = tensor("op_3461_cast_fp16")]; tensor encoder_layers_15_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194000064)))]; tensor var_3463_cast_fp16 = add(x = q_91_cast_fp16, y = encoder_layers_15_self_attn_pos_bias_v_to_fp16)[name = tensor("op_3463_cast_fp16")]; tensor q_with_bias_v_31_perm_0 = const()[name = tensor("q_with_bias_v_31_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_397_transpose_x_0 = const()[name = tensor("x_397_transpose_x_0"), val = tensor(false)]; tensor x_397_transpose_y_0 = const()[name = tensor("x_397_transpose_y_0"), val = tensor(false)]; tensor var_3465_to_fp16 = const()[name = tensor("op_3465_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194001152)))]; tensor q_with_bias_v_31_cast_fp16 = transpose(perm = q_with_bias_v_31_perm_0, x = var_3463_cast_fp16)[name = tensor("transpose_102")]; tensor x_397_cast_fp16 = matmul(transpose_x = x_397_transpose_x_0, transpose_y = x_397_transpose_y_0, x = q_with_bias_v_31_cast_fp16, y = var_3465_to_fp16)[name = tensor("x_397_cast_fp16")]; tensor x_399_pad_0 = const()[name = tensor("x_399_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_399_mode_0 = const()[name = tensor("x_399_mode_0"), val = tensor("constant")]; tensor const_218_to_fp16 = const()[name = tensor("const_218_to_fp16"), val = tensor(0x0p+0)]; tensor x_399_cast_fp16 = pad(constant_val = const_218_to_fp16, mode = x_399_mode_0, pad = x_399_pad_0, x = x_397_cast_fp16)[name = tensor("x_399_cast_fp16")]; tensor var_3473 = const()[name = tensor("op_3473"), val = tensor([1, 8, -1, 3])]; tensor x_401_cast_fp16 = reshape(shape = var_3473, x = x_399_cast_fp16)[name = tensor("x_401_cast_fp16")]; tensor var_3477_begin_0 = const()[name = tensor("op_3477_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_3477_end_0 = const()[name = tensor("op_3477_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_3477_end_mask_0 = const()[name = tensor("op_3477_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_3477_cast_fp16 = slice_by_index(begin = var_3477_begin_0, end = var_3477_end_0, end_mask = var_3477_end_mask_0, x = x_401_cast_fp16)[name = tensor("op_3477_cast_fp16")]; tensor var_3478 = const()[name = tensor("op_3478"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_61_cast_fp16 = reshape(shape = var_3478, x = var_3477_cast_fp16)[name = tensor("matrix_bd_61_cast_fp16")]; tensor matrix_ac_31_transpose_x_0 = const()[name = tensor("matrix_ac_31_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_31_transpose_y_0 = const()[name = tensor("matrix_ac_31_transpose_y_0"), val = tensor(false)]; tensor transpose_81_perm_0 = const()[name = tensor("transpose_81_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_82_perm_0 = const()[name = tensor("transpose_82_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_82 = transpose(perm = transpose_82_perm_0, x = k_61_cast_fp16)[name = tensor("transpose_100")]; tensor transpose_81 = transpose(perm = transpose_81_perm_0, x = var_3461_cast_fp16)[name = tensor("transpose_101")]; tensor matrix_ac_31_cast_fp16 = matmul(transpose_x = matrix_ac_31_transpose_x_0, transpose_y = matrix_ac_31_transpose_y_0, x = transpose_81, y = transpose_82)[name = tensor("matrix_ac_31_cast_fp16")]; tensor matrix_bd_63_begin_0 = const()[name = tensor("matrix_bd_63_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_63_end_0 = const()[name = tensor("matrix_bd_63_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_63_end_mask_0 = const()[name = tensor("matrix_bd_63_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_63_cast_fp16 = slice_by_index(begin = matrix_bd_63_begin_0, end = matrix_bd_63_end_0, end_mask = matrix_bd_63_end_mask_0, x = matrix_bd_61_cast_fp16)[name = tensor("matrix_bd_63_cast_fp16")]; tensor var_3487_cast_fp16 = add(x = matrix_ac_31_cast_fp16, y = matrix_bd_63_cast_fp16)[name = tensor("op_3487_cast_fp16")]; tensor _inversed_scores_61_y_0_to_fp16 = const()[name = tensor("_inversed_scores_61_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_61_cast_fp16 = mul(x = var_3487_cast_fp16, y = _inversed_scores_61_y_0_to_fp16)[name = tensor("_inversed_scores_61_cast_fp16")]; tensor scores_63_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_61_cast_fp16, cond = mask_3)[name = tensor("scores_63_cast_fp16")]; tensor var_3493_cast_fp16 = softmax(axis = var_62, x = scores_63_cast_fp16)[name = tensor("op_3493_cast_fp16")]; tensor input_821_cast_fp16 = select(a = var_40_to_fp16, b = var_3493_cast_fp16, cond = mask_3)[name = tensor("input_821_cast_fp16")]; tensor x_403_transpose_x_0 = const()[name = tensor("x_403_transpose_x_0"), val = tensor(false)]; tensor x_403_transpose_y_0 = const()[name = tensor("x_403_transpose_y_0"), val = tensor(false)]; tensor value_33_cast_fp16 = transpose(perm = value_33_perm_0, x = v_31_cast_fp16)[name = tensor("transpose_103")]; tensor x_403_cast_fp16 = matmul(transpose_x = x_403_transpose_x_0, transpose_y = x_403_transpose_y_0, x = input_821_cast_fp16, y = value_33_cast_fp16)[name = tensor("x_403_cast_fp16")]; tensor var_3497_perm_0 = const()[name = tensor("op_3497_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3498 = const()[name = tensor("op_3498"), val = tensor([1, -1, 512])]; tensor var_3497_cast_fp16 = transpose(perm = var_3497_perm_0, x = x_403_cast_fp16)[name = tensor("transpose_99")]; tensor input_823_cast_fp16 = reshape(shape = var_3498, x = var_3497_cast_fp16)[name = tensor("input_823_cast_fp16")]; tensor encoder_layers_15_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_15_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194149696)))]; tensor linear_142_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_15_self_attn_linear_out_weight_to_fp16, x = input_823_cast_fp16)[name = tensor("linear_142_cast_fp16")]; tensor input_827_cast_fp16 = add(x = input_817_cast_fp16, y = linear_142_cast_fp16)[name = tensor("input_827_cast_fp16")]; tensor x_407_axes_0 = const()[name = tensor("x_407_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_15_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194674048)))]; tensor encoder_layers_15_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_15_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194675136)))]; tensor x_407_cast_fp16 = layer_norm(axes = x_407_axes_0, beta = encoder_layers_15_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_15_norm_conv_weight_to_fp16, x = input_827_cast_fp16)[name = tensor("x_407_cast_fp16")]; tensor input_829_perm_0 = const()[name = tensor("input_829_perm_0"), val = tensor([0, 2, 1])]; tensor input_831_pad_type_0 = const()[name = tensor("input_831_pad_type_0"), val = tensor("valid")]; tensor input_831_strides_0 = const()[name = tensor("input_831_strides_0"), val = tensor([1])]; tensor input_831_pad_0 = const()[name = tensor("input_831_pad_0"), val = tensor([0, 0])]; tensor input_831_dilations_0 = const()[name = tensor("input_831_dilations_0"), val = tensor([1])]; tensor input_831_groups_0 = const()[name = tensor("input_831_groups_0"), val = tensor(1)]; tensor encoder_layers_15_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_15_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194676224)))]; tensor input_829_cast_fp16 = transpose(perm = input_829_perm_0, x = x_407_cast_fp16)[name = tensor("transpose_98")]; tensor input_831_cast_fp16 = conv(dilations = input_831_dilations_0, groups = input_831_groups_0, pad = input_831_pad_0, pad_type = input_831_pad_type_0, strides = input_831_strides_0, weight = encoder_layers_15_conv_pointwise_conv1_weight_to_fp16, x = input_829_cast_fp16)[name = tensor("input_831_cast_fp16")]; tensor x_409_split_num_splits_0 = const()[name = tensor("x_409_split_num_splits_0"), val = tensor(2)]; tensor x_409_split_axis_0 = const()[name = tensor("x_409_split_axis_0"), val = tensor(1)]; tensor x_409_split_cast_fp16_0, tensor x_409_split_cast_fp16_1 = split(axis = x_409_split_axis_0, num_splits = x_409_split_num_splits_0, x = input_831_cast_fp16)[name = tensor("x_409_split_cast_fp16")]; tensor x_409_split_1_sigmoid_cast_fp16 = sigmoid(x = x_409_split_cast_fp16_1)[name = tensor("x_409_split_1_sigmoid_cast_fp16")]; tensor x_409_cast_fp16 = mul(x = x_409_split_cast_fp16_0, y = x_409_split_1_sigmoid_cast_fp16)[name = tensor("x_409_cast_fp16")]; tensor input_833_cast_fp16 = select(a = var_40_to_fp16, b = x_409_cast_fp16, cond = var_418)[name = tensor("input_833_cast_fp16")]; tensor new_x_63_interleave_0 = const()[name = tensor("new_x_63_interleave_0"), val = tensor(false)]; tensor new_x_63_cast_fp16 = concat(axis = var_62, interleave = new_x_63_interleave_0, values = (cache_63_cast_fp16, input_833_cast_fp16))[name = tensor("new_x_63_cast_fp16")]; tensor next_cache_31_begin_0 = const()[name = tensor("next_cache_31_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_31_end_0 = const()[name = tensor("next_cache_31_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_31_end_mask_0 = const()[name = tensor("next_cache_31_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_31_cast_fp16 = slice_by_index(begin = next_cache_31_begin_0, end = next_cache_31_end_0, end_mask = next_cache_31_end_mask_0, x = new_x_63_cast_fp16)[name = tensor("next_cache_31_cast_fp16")]; tensor var_3539_begin_0 = const()[name = tensor("op_3539_begin_0"), val = tensor([0, 0, 1])]; tensor var_3539_end_0 = const()[name = tensor("op_3539_end_0"), val = tensor([1, 512, 9])]; tensor var_3539_end_mask_0 = const()[name = tensor("op_3539_end_mask_0"), val = tensor([true, true, true])]; tensor var_3539_cast_fp16 = slice_by_index(begin = var_3539_begin_0, end = var_3539_end_0, end_mask = var_3539_end_mask_0, x = next_cache_31_cast_fp16)[name = tensor("op_3539_cast_fp16")]; tensor x_411_pad_type_0 = const()[name = tensor("x_411_pad_type_0"), val = tensor("valid")]; tensor x_411_groups_0 = const()[name = tensor("x_411_groups_0"), val = tensor(512)]; tensor x_411_strides_0 = const()[name = tensor("x_411_strides_0"), val = tensor([1])]; tensor x_411_pad_0 = const()[name = tensor("x_411_pad_0"), val = tensor([0, 0])]; tensor x_411_dilations_0 = const()[name = tensor("x_411_dilations_0"), val = tensor([1])]; tensor encoder_layers_15_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_15_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(195724864)))]; tensor x_411_cast_fp16 = conv(dilations = x_411_dilations_0, groups = x_411_groups_0, pad = x_411_pad_0, pad_type = x_411_pad_type_0, strides = x_411_strides_0, weight = encoder_layers_15_conv_depthwise_conv_weight_to_fp16, x = new_x_63_cast_fp16)[name = tensor("x_411_cast_fp16")]; tensor input_835_perm_0 = const()[name = tensor("input_835_perm_0"), val = tensor([0, 2, 1])]; tensor x_413_axes_0 = const()[name = tensor("x_413_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_15_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(195734144)))]; tensor encoder_layers_15_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_15_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(195735232)))]; tensor input_835_cast_fp16 = transpose(perm = input_835_perm_0, x = x_411_cast_fp16)[name = tensor("transpose_97")]; tensor x_413_cast_fp16 = layer_norm(axes = x_413_axes_0, beta = encoder_layers_15_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_15_conv_batch_norm_weight_to_fp16, x = input_835_cast_fp16)[name = tensor("x_413_cast_fp16")]; tensor input_837_perm_0 = const()[name = tensor("input_837_perm_0"), val = tensor([0, 2, 1])]; tensor input_837_cast_fp16 = transpose(perm = input_837_perm_0, x = x_413_cast_fp16)[name = tensor("transpose_96")]; tensor input_839_cast_fp16 = silu(x = input_837_cast_fp16)[name = tensor("input_839_cast_fp16")]; tensor x_415_pad_type_0 = const()[name = tensor("x_415_pad_type_0"), val = tensor("valid")]; tensor x_415_strides_0 = const()[name = tensor("x_415_strides_0"), val = tensor([1])]; tensor x_415_pad_0 = const()[name = tensor("x_415_pad_0"), val = tensor([0, 0])]; tensor x_415_dilations_0 = const()[name = tensor("x_415_dilations_0"), val = tensor([1])]; tensor x_415_groups_0 = const()[name = tensor("x_415_groups_0"), val = tensor(1)]; tensor encoder_layers_15_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_15_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(195736320)))]; tensor x_415_cast_fp16 = conv(dilations = x_415_dilations_0, groups = x_415_groups_0, pad = x_415_pad_0, pad_type = x_415_pad_type_0, strides = x_415_strides_0, weight = encoder_layers_15_conv_pointwise_conv2_weight_to_fp16, x = input_839_cast_fp16)[name = tensor("x_415_cast_fp16")]; tensor input_841_perm_0 = const()[name = tensor("input_841_perm_0"), val = tensor([0, 2, 1])]; tensor input_841_cast_fp16 = transpose(perm = input_841_perm_0, x = x_415_cast_fp16)[name = tensor("transpose_95")]; tensor input_843_cast_fp16 = add(x = input_827_cast_fp16, y = input_841_cast_fp16)[name = tensor("input_843_cast_fp16")]; tensor input_845_axes_0 = const()[name = tensor("input_845_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_15_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(196260672)))]; tensor encoder_layers_15_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_15_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(196261760)))]; tensor input_845_cast_fp16 = layer_norm(axes = input_845_axes_0, beta = encoder_layers_15_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_15_norm_feed_forward2_weight_to_fp16, x = input_843_cast_fp16)[name = tensor("input_845_cast_fp16")]; tensor encoder_layers_15_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_15_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(196262848)))]; tensor linear_143_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_15_feed_forward2_linear1_weight_to_fp16, x = input_845_cast_fp16)[name = tensor("linear_143_cast_fp16")]; tensor input_849_cast_fp16 = silu(x = linear_143_cast_fp16)[name = tensor("input_849_cast_fp16")]; tensor encoder_layers_15_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_15_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198360064)))]; tensor linear_144_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_15_feed_forward2_linear2_weight_to_fp16, x = input_849_cast_fp16)[name = tensor("linear_144_cast_fp16")]; tensor var_3580_to_fp16 = const()[name = tensor("op_3580_to_fp16"), val = tensor(0x1p-1)]; tensor var_3581_cast_fp16 = mul(x = linear_144_cast_fp16, y = var_3580_to_fp16)[name = tensor("op_3581_cast_fp16")]; tensor input_855_cast_fp16 = add(x = input_843_cast_fp16, y = var_3581_cast_fp16)[name = tensor("input_855_cast_fp16")]; tensor input_857_axes_0 = const()[name = tensor("input_857_axes_0"), val = tensor([-1])]; tensor encoder_layers_15_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_15_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(200457280)))]; tensor encoder_layers_15_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_15_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(200458368)))]; tensor input_857_cast_fp16 = layer_norm(axes = input_857_axes_0, beta = encoder_layers_15_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_15_norm_out_weight_to_fp16, x = input_855_cast_fp16)[name = tensor("input_857_cast_fp16")]; tensor cache_65_begin_0 = const()[name = tensor("cache_65_begin_0"), val = tensor([16, 0, 0, 0])]; tensor cache_65_end_0 = const()[name = tensor("cache_65_end_0"), val = tensor([17, 1, 70, 512])]; tensor cache_65_end_mask_0 = const()[name = tensor("cache_65_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_65_squeeze_mask_0 = const()[name = tensor("cache_65_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_65_cast_fp16 = slice_by_index(begin = cache_65_begin_0, end = cache_65_end_0, end_mask = cache_65_end_mask_0, squeeze_mask = cache_65_squeeze_mask_0, x = cache_last_channel_to_fp16)[name = tensor("cache_65_cast_fp16")]; tensor cache_begin_0 = const()[name = tensor("cache_begin_0"), val = tensor([16, 0, 0, 0])]; tensor cache_end_0 = const()[name = tensor("cache_end_0"), val = tensor([17, 1, 512, 8])]; tensor cache_end_mask_0 = const()[name = tensor("cache_end_mask_0"), val = tensor([false, true, true, true])]; tensor cache_squeeze_mask_0 = const()[name = tensor("cache_squeeze_mask_0"), val = tensor([true, false, false, false])]; tensor cache_cast_fp16 = slice_by_index(begin = cache_begin_0, end = cache_end_0, end_mask = cache_end_mask_0, squeeze_mask = cache_squeeze_mask_0, x = cache_last_time_to_fp16)[name = tensor("cache_cast_fp16")]; tensor input_859_axes_0 = const()[name = tensor("input_859_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_norm_feed_forward1_weight_to_fp16 = const()[name = tensor("encoder_layers_16_norm_feed_forward1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(200459456)))]; tensor encoder_layers_16_norm_feed_forward1_bias_to_fp16 = const()[name = tensor("encoder_layers_16_norm_feed_forward1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(200460544)))]; tensor input_859_cast_fp16 = layer_norm(axes = input_859_axes_0, beta = encoder_layers_16_norm_feed_forward1_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_16_norm_feed_forward1_weight_to_fp16, x = input_857_cast_fp16)[name = tensor("input_859_cast_fp16")]; tensor encoder_layers_16_feed_forward1_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_16_feed_forward1_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(200461632)))]; tensor linear_145_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_16_feed_forward1_linear1_weight_to_fp16, x = input_859_cast_fp16)[name = tensor("linear_145_cast_fp16")]; tensor input_863_cast_fp16 = silu(x = linear_145_cast_fp16)[name = tensor("input_863_cast_fp16")]; tensor encoder_layers_16_feed_forward1_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_16_feed_forward1_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202558848)))]; tensor linear_146_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_16_feed_forward1_linear2_weight_to_fp16, x = input_863_cast_fp16)[name = tensor("linear_146_cast_fp16")]; tensor var_3615_to_fp16 = const()[name = tensor("op_3615_to_fp16"), val = tensor(0x1p-1)]; tensor var_3616_cast_fp16 = mul(x = linear_146_cast_fp16, y = var_3615_to_fp16)[name = tensor("op_3616_cast_fp16")]; tensor input_869_cast_fp16 = add(x = input_857_cast_fp16, y = var_3616_cast_fp16)[name = tensor("input_869_cast_fp16")]; tensor key_axes_0 = const()[name = tensor("key_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_norm_self_att_weight_to_fp16 = const()[name = tensor("encoder_layers_16_norm_self_att_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(204656064)))]; tensor encoder_layers_16_norm_self_att_bias_to_fp16 = const()[name = tensor("encoder_layers_16_norm_self_att_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(204657152)))]; tensor key_cast_fp16 = layer_norm(axes = key_axes_0, beta = encoder_layers_16_norm_self_att_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_16_norm_self_att_weight_to_fp16, x = input_869_cast_fp16)[name = tensor("key_cast_fp16")]; tensor input_871_interleave_0 = const()[name = tensor("input_871_interleave_0"), val = tensor(false)]; tensor input_871_cast_fp16 = concat(axis = var_64, interleave = input_871_interleave_0, values = (cache_65_cast_fp16, key_cast_fp16))[name = tensor("input_871_cast_fp16")]; tensor var_3638_begin_0 = const()[name = tensor("op_3638_begin_0"), val = tensor([0, 1, 0])]; tensor var_3638_end_0 = const()[name = tensor("op_3638_end_0"), val = tensor([1, 70, 512])]; tensor var_3638_end_mask_0 = const()[name = tensor("op_3638_end_mask_0"), val = tensor([true, true, true])]; tensor var_3638_cast_fp16 = slice_by_index(begin = var_3638_begin_0, end = var_3638_end_0, end_mask = var_3638_end_mask_0, x = cache_65_cast_fp16)[name = tensor("op_3638_cast_fp16")]; tensor var_3641_begin_0 = const()[name = tensor("op_3641_begin_0"), val = tensor([0, 0, 0])]; tensor var_3641_end_0 = const()[name = tensor("op_3641_end_0"), val = tensor([1, 1, 512])]; tensor var_3641_end_mask_0 = const()[name = tensor("op_3641_end_mask_0"), val = tensor([true, false, true])]; tensor var_3641_cast_fp16 = slice_by_index(begin = var_3641_begin_0, end = var_3641_end_0, end_mask = var_3641_end_mask_0, x = key_cast_fp16)[name = tensor("op_3641_cast_fp16")]; tensor cache_last_channel_cur_interleave_0 = const()[name = tensor("cache_last_channel_cur_interleave_0"), val = tensor(false)]; tensor cache_last_channel_cur_cast_fp16 = concat(axis = var_64, interleave = cache_last_channel_cur_interleave_0, values = (var_3638_cast_fp16, var_3641_cast_fp16))[name = tensor("cache_last_channel_cur_cast_fp16")]; tensor encoder_layers_16_self_attn_linear_q_weight_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_linear_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(204658240)))]; tensor linear_147_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_16_self_attn_linear_q_weight_to_fp16, x = key_cast_fp16)[name = tensor("linear_147_cast_fp16")]; tensor var_3648 = const()[name = tensor("op_3648"), val = tensor([1, -1, 8, 64])]; tensor q_97_cast_fp16 = reshape(shape = var_3648, x = linear_147_cast_fp16)[name = tensor("q_97_cast_fp16")]; tensor encoder_layers_16_self_attn_linear_k_weight_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_linear_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(205182592)))]; tensor linear_148_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_16_self_attn_linear_k_weight_to_fp16, x = input_871_cast_fp16)[name = tensor("linear_148_cast_fp16")]; tensor var_3652 = const()[name = tensor("op_3652"), val = tensor([1, -1, 8, 64])]; tensor k_65_cast_fp16 = reshape(shape = var_3652, x = linear_148_cast_fp16)[name = tensor("k_65_cast_fp16")]; tensor encoder_layers_16_self_attn_linear_v_weight_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_linear_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(205706944)))]; tensor linear_149_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_16_self_attn_linear_v_weight_to_fp16, x = input_871_cast_fp16)[name = tensor("linear_149_cast_fp16")]; tensor var_3656 = const()[name = tensor("op_3656"), val = tensor([1, -1, 8, 64])]; tensor v_cast_fp16 = reshape(shape = var_3656, x = linear_149_cast_fp16)[name = tensor("v_cast_fp16")]; tensor value_perm_0 = const()[name = tensor("value_perm_0"), val = tensor([0, 2, 1, 3])]; tensor encoder_layers_16_self_attn_pos_bias_u_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_pos_bias_u_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(206231296)))]; tensor var_3668_cast_fp16 = add(x = q_97_cast_fp16, y = encoder_layers_16_self_attn_pos_bias_u_to_fp16)[name = tensor("op_3668_cast_fp16")]; tensor encoder_layers_16_self_attn_pos_bias_v_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_pos_bias_v_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(206232384)))]; tensor var_3670_cast_fp16 = add(x = q_97_cast_fp16, y = encoder_layers_16_self_attn_pos_bias_v_to_fp16)[name = tensor("op_3670_cast_fp16")]; tensor q_with_bias_v_perm_0 = const()[name = tensor("q_with_bias_v_perm_0"), val = tensor([0, 2, 1, 3])]; tensor x_423_transpose_x_0 = const()[name = tensor("x_423_transpose_x_0"), val = tensor(false)]; tensor x_423_transpose_y_0 = const()[name = tensor("x_423_transpose_y_0"), val = tensor(false)]; tensor var_3672_to_fp16 = const()[name = tensor("op_3672_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(206233472)))]; tensor q_with_bias_v_cast_fp16 = transpose(perm = q_with_bias_v_perm_0, x = var_3670_cast_fp16)[name = tensor("transpose_93")]; tensor x_423_cast_fp16 = matmul(transpose_x = x_423_transpose_x_0, transpose_y = x_423_transpose_y_0, x = q_with_bias_v_cast_fp16, y = var_3672_to_fp16)[name = tensor("x_423_cast_fp16")]; tensor x_425_pad_0 = const()[name = tensor("x_425_pad_0"), val = tensor([0, 0, 0, 0, 0, 0, 1, 0])]; tensor x_425_mode_0 = const()[name = tensor("x_425_mode_0"), val = tensor("constant")]; tensor const_231_to_fp16 = const()[name = tensor("const_231_to_fp16"), val = tensor(0x0p+0)]; tensor x_425_cast_fp16 = pad(constant_val = const_231_to_fp16, mode = x_425_mode_0, pad = x_425_pad_0, x = x_423_cast_fp16)[name = tensor("x_425_cast_fp16")]; tensor var_3680 = const()[name = tensor("op_3680"), val = tensor([1, 8, -1, 3])]; tensor x_427_cast_fp16 = reshape(shape = var_3680, x = x_425_cast_fp16)[name = tensor("x_427_cast_fp16")]; tensor var_3684_begin_0 = const()[name = tensor("op_3684_begin_0"), val = tensor([0, 0, 1, 0])]; tensor var_3684_end_0 = const()[name = tensor("op_3684_end_0"), val = tensor([1, 8, 146, 3])]; tensor var_3684_end_mask_0 = const()[name = tensor("op_3684_end_mask_0"), val = tensor([true, true, true, true])]; tensor var_3684_cast_fp16 = slice_by_index(begin = var_3684_begin_0, end = var_3684_end_0, end_mask = var_3684_end_mask_0, x = x_427_cast_fp16)[name = tensor("op_3684_cast_fp16")]; tensor var_3685 = const()[name = tensor("op_3685"), val = tensor([1, 8, 3, 145])]; tensor matrix_bd_65_cast_fp16 = reshape(shape = var_3685, x = var_3684_cast_fp16)[name = tensor("matrix_bd_65_cast_fp16")]; tensor matrix_ac_transpose_x_0 = const()[name = tensor("matrix_ac_transpose_x_0"), val = tensor(false)]; tensor matrix_ac_transpose_y_0 = const()[name = tensor("matrix_ac_transpose_y_0"), val = tensor(false)]; tensor transpose_83_perm_0 = const()[name = tensor("transpose_83_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_84_perm_0 = const()[name = tensor("transpose_84_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_84 = transpose(perm = transpose_84_perm_0, x = k_65_cast_fp16)[name = tensor("transpose_91")]; tensor transpose_83 = transpose(perm = transpose_83_perm_0, x = var_3668_cast_fp16)[name = tensor("transpose_92")]; tensor matrix_ac_cast_fp16 = matmul(transpose_x = matrix_ac_transpose_x_0, transpose_y = matrix_ac_transpose_y_0, x = transpose_83, y = transpose_84)[name = tensor("matrix_ac_cast_fp16")]; tensor matrix_bd_begin_0 = const()[name = tensor("matrix_bd_begin_0"), val = tensor([0, 0, 0, 0])]; tensor matrix_bd_end_0 = const()[name = tensor("matrix_bd_end_0"), val = tensor([1, 8, 3, 73])]; tensor matrix_bd_end_mask_0 = const()[name = tensor("matrix_bd_end_mask_0"), val = tensor([true, true, true, false])]; tensor matrix_bd_cast_fp16 = slice_by_index(begin = matrix_bd_begin_0, end = matrix_bd_end_0, end_mask = matrix_bd_end_mask_0, x = matrix_bd_65_cast_fp16)[name = tensor("matrix_bd_cast_fp16")]; tensor var_3694_cast_fp16 = add(x = matrix_ac_cast_fp16, y = matrix_bd_cast_fp16)[name = tensor("op_3694_cast_fp16")]; tensor _inversed_scores_65_y_0_to_fp16 = const()[name = tensor("_inversed_scores_65_y_0_to_fp16"), val = tensor(0x1p-3)]; tensor _inversed_scores_65_cast_fp16 = mul(x = var_3694_cast_fp16, y = _inversed_scores_65_y_0_to_fp16)[name = tensor("_inversed_scores_65_cast_fp16")]; tensor scores_cast_fp16 = select(a = var_41_to_fp16, b = _inversed_scores_65_cast_fp16, cond = mask_3)[name = tensor("scores_cast_fp16")]; tensor var_3700_cast_fp16 = softmax(axis = var_62, x = scores_cast_fp16)[name = tensor("op_3700_cast_fp16")]; tensor input_873_cast_fp16 = select(a = var_40_to_fp16, b = var_3700_cast_fp16, cond = mask_3)[name = tensor("input_873_cast_fp16")]; tensor x_429_transpose_x_0 = const()[name = tensor("x_429_transpose_x_0"), val = tensor(false)]; tensor x_429_transpose_y_0 = const()[name = tensor("x_429_transpose_y_0"), val = tensor(false)]; tensor value_cast_fp16 = transpose(perm = value_perm_0, x = v_cast_fp16)[name = tensor("transpose_94")]; tensor x_429_cast_fp16 = matmul(transpose_x = x_429_transpose_x_0, transpose_y = x_429_transpose_y_0, x = input_873_cast_fp16, y = value_cast_fp16)[name = tensor("x_429_cast_fp16")]; tensor var_3704_perm_0 = const()[name = tensor("op_3704_perm_0"), val = tensor([0, 2, 1, 3])]; tensor var_3705 = const()[name = tensor("op_3705"), val = tensor([1, -1, 512])]; tensor var_3704_cast_fp16 = transpose(perm = var_3704_perm_0, x = x_429_cast_fp16)[name = tensor("transpose_90")]; tensor input_875_cast_fp16 = reshape(shape = var_3705, x = var_3704_cast_fp16)[name = tensor("input_875_cast_fp16")]; tensor encoder_layers_16_self_attn_linear_out_weight_to_fp16 = const()[name = tensor("encoder_layers_16_self_attn_linear_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(206382016)))]; tensor linear_151_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_16_self_attn_linear_out_weight_to_fp16, x = input_875_cast_fp16)[name = tensor("linear_151_cast_fp16")]; tensor input_879_cast_fp16 = add(x = input_869_cast_fp16, y = linear_151_cast_fp16)[name = tensor("input_879_cast_fp16")]; tensor x_433_axes_0 = const()[name = tensor("x_433_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_norm_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_16_norm_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(206906368)))]; tensor encoder_layers_16_norm_conv_bias_to_fp16 = const()[name = tensor("encoder_layers_16_norm_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(206907456)))]; tensor x_433_cast_fp16 = layer_norm(axes = x_433_axes_0, beta = encoder_layers_16_norm_conv_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_16_norm_conv_weight_to_fp16, x = input_879_cast_fp16)[name = tensor("x_433_cast_fp16")]; tensor input_881_perm_0 = const()[name = tensor("input_881_perm_0"), val = tensor([0, 2, 1])]; tensor input_883_pad_type_0 = const()[name = tensor("input_883_pad_type_0"), val = tensor("valid")]; tensor input_883_strides_0 = const()[name = tensor("input_883_strides_0"), val = tensor([1])]; tensor input_883_pad_0 = const()[name = tensor("input_883_pad_0"), val = tensor([0, 0])]; tensor input_883_dilations_0 = const()[name = tensor("input_883_dilations_0"), val = tensor([1])]; tensor input_883_groups_0 = const()[name = tensor("input_883_groups_0"), val = tensor(1)]; tensor encoder_layers_16_conv_pointwise_conv1_weight_to_fp16 = const()[name = tensor("encoder_layers_16_conv_pointwise_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(206908544)))]; tensor input_881_cast_fp16 = transpose(perm = input_881_perm_0, x = x_433_cast_fp16)[name = tensor("transpose_89")]; tensor input_883_cast_fp16 = conv(dilations = input_883_dilations_0, groups = input_883_groups_0, pad = input_883_pad_0, pad_type = input_883_pad_type_0, strides = input_883_strides_0, weight = encoder_layers_16_conv_pointwise_conv1_weight_to_fp16, x = input_881_cast_fp16)[name = tensor("input_883_cast_fp16")]; tensor x_435_split_num_splits_0 = const()[name = tensor("x_435_split_num_splits_0"), val = tensor(2)]; tensor x_435_split_axis_0 = const()[name = tensor("x_435_split_axis_0"), val = tensor(1)]; tensor x_435_split_cast_fp16_0, tensor x_435_split_cast_fp16_1 = split(axis = x_435_split_axis_0, num_splits = x_435_split_num_splits_0, x = input_883_cast_fp16)[name = tensor("x_435_split_cast_fp16")]; tensor x_435_split_1_sigmoid_cast_fp16 = sigmoid(x = x_435_split_cast_fp16_1)[name = tensor("x_435_split_1_sigmoid_cast_fp16")]; tensor x_435_cast_fp16 = mul(x = x_435_split_cast_fp16_0, y = x_435_split_1_sigmoid_cast_fp16)[name = tensor("x_435_cast_fp16")]; tensor input_885_cast_fp16 = select(a = var_40_to_fp16, b = x_435_cast_fp16, cond = var_418)[name = tensor("input_885_cast_fp16")]; tensor new_x_interleave_0 = const()[name = tensor("new_x_interleave_0"), val = tensor(false)]; tensor new_x_cast_fp16 = concat(axis = var_62, interleave = new_x_interleave_0, values = (cache_cast_fp16, input_885_cast_fp16))[name = tensor("new_x_cast_fp16")]; tensor next_cache_begin_0 = const()[name = tensor("next_cache_begin_0"), val = tensor([0, 0, 0])]; tensor next_cache_end_0 = const()[name = tensor("next_cache_end_0"), val = tensor([1, 512, 9])]; tensor next_cache_end_mask_0 = const()[name = tensor("next_cache_end_mask_0"), val = tensor([true, true, false])]; tensor next_cache_cast_fp16 = slice_by_index(begin = next_cache_begin_0, end = next_cache_end_0, end_mask = next_cache_end_mask_0, x = new_x_cast_fp16)[name = tensor("next_cache_cast_fp16")]; tensor cache_last_time_cur_begin_0 = const()[name = tensor("cache_last_time_cur_begin_0"), val = tensor([0, 0, 1])]; tensor cache_last_time_cur_end_0 = const()[name = tensor("cache_last_time_cur_end_0"), val = tensor([1, 512, 9])]; tensor cache_last_time_cur_end_mask_0 = const()[name = tensor("cache_last_time_cur_end_mask_0"), val = tensor([true, true, true])]; tensor cache_last_time_cur_cast_fp16 = slice_by_index(begin = cache_last_time_cur_begin_0, end = cache_last_time_cur_end_0, end_mask = cache_last_time_cur_end_mask_0, x = next_cache_cast_fp16)[name = tensor("cache_last_time_cur_cast_fp16")]; tensor x_437_pad_type_0 = const()[name = tensor("x_437_pad_type_0"), val = tensor("valid")]; tensor x_437_groups_0 = const()[name = tensor("x_437_groups_0"), val = tensor(512)]; tensor x_437_strides_0 = const()[name = tensor("x_437_strides_0"), val = tensor([1])]; tensor x_437_pad_0 = const()[name = tensor("x_437_pad_0"), val = tensor([0, 0])]; tensor x_437_dilations_0 = const()[name = tensor("x_437_dilations_0"), val = tensor([1])]; tensor encoder_layers_16_conv_depthwise_conv_weight_to_fp16 = const()[name = tensor("encoder_layers_16_conv_depthwise_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(207957184)))]; tensor x_437_cast_fp16 = conv(dilations = x_437_dilations_0, groups = x_437_groups_0, pad = x_437_pad_0, pad_type = x_437_pad_type_0, strides = x_437_strides_0, weight = encoder_layers_16_conv_depthwise_conv_weight_to_fp16, x = new_x_cast_fp16)[name = tensor("x_437_cast_fp16")]; tensor input_887_perm_0 = const()[name = tensor("input_887_perm_0"), val = tensor([0, 2, 1])]; tensor x_439_axes_0 = const()[name = tensor("x_439_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_conv_batch_norm_weight_to_fp16 = const()[name = tensor("encoder_layers_16_conv_batch_norm_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(207966464)))]; tensor encoder_layers_16_conv_batch_norm_bias_to_fp16 = const()[name = tensor("encoder_layers_16_conv_batch_norm_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(207967552)))]; tensor input_887_cast_fp16 = transpose(perm = input_887_perm_0, x = x_437_cast_fp16)[name = tensor("transpose_88")]; tensor x_439_cast_fp16 = layer_norm(axes = x_439_axes_0, beta = encoder_layers_16_conv_batch_norm_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_16_conv_batch_norm_weight_to_fp16, x = input_887_cast_fp16)[name = tensor("x_439_cast_fp16")]; tensor input_889_perm_0 = const()[name = tensor("input_889_perm_0"), val = tensor([0, 2, 1])]; tensor input_889_cast_fp16 = transpose(perm = input_889_perm_0, x = x_439_cast_fp16)[name = tensor("transpose_87")]; tensor input_891_cast_fp16 = silu(x = input_889_cast_fp16)[name = tensor("input_891_cast_fp16")]; tensor x_441_pad_type_0 = const()[name = tensor("x_441_pad_type_0"), val = tensor("valid")]; tensor x_441_strides_0 = const()[name = tensor("x_441_strides_0"), val = tensor([1])]; tensor x_441_pad_0 = const()[name = tensor("x_441_pad_0"), val = tensor([0, 0])]; tensor x_441_dilations_0 = const()[name = tensor("x_441_dilations_0"), val = tensor([1])]; tensor x_441_groups_0 = const()[name = tensor("x_441_groups_0"), val = tensor(1)]; tensor encoder_layers_16_conv_pointwise_conv2_weight_to_fp16 = const()[name = tensor("encoder_layers_16_conv_pointwise_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(207968640)))]; tensor x_441_cast_fp16 = conv(dilations = x_441_dilations_0, groups = x_441_groups_0, pad = x_441_pad_0, pad_type = x_441_pad_type_0, strides = x_441_strides_0, weight = encoder_layers_16_conv_pointwise_conv2_weight_to_fp16, x = input_891_cast_fp16)[name = tensor("x_441_cast_fp16")]; tensor input_893_perm_0 = const()[name = tensor("input_893_perm_0"), val = tensor([0, 2, 1])]; tensor input_893_cast_fp16 = transpose(perm = input_893_perm_0, x = x_441_cast_fp16)[name = tensor("transpose_86")]; tensor input_895_cast_fp16 = add(x = input_879_cast_fp16, y = input_893_cast_fp16)[name = tensor("input_895_cast_fp16")]; tensor input_897_axes_0 = const()[name = tensor("input_897_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_norm_feed_forward2_weight_to_fp16 = const()[name = tensor("encoder_layers_16_norm_feed_forward2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(208492992)))]; tensor encoder_layers_16_norm_feed_forward2_bias_to_fp16 = const()[name = tensor("encoder_layers_16_norm_feed_forward2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(208494080)))]; tensor input_897_cast_fp16 = layer_norm(axes = input_897_axes_0, beta = encoder_layers_16_norm_feed_forward2_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_16_norm_feed_forward2_weight_to_fp16, x = input_895_cast_fp16)[name = tensor("input_897_cast_fp16")]; tensor encoder_layers_16_feed_forward2_linear1_weight_to_fp16 = const()[name = tensor("encoder_layers_16_feed_forward2_linear1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(208495168)))]; tensor linear_152_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = encoder_layers_16_feed_forward2_linear1_weight_to_fp16, x = input_897_cast_fp16)[name = tensor("linear_152_cast_fp16")]; tensor input_901_cast_fp16 = silu(x = linear_152_cast_fp16)[name = tensor("input_901_cast_fp16")]; tensor encoder_layers_16_feed_forward2_linear2_weight_to_fp16 = const()[name = tensor("encoder_layers_16_feed_forward2_linear2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(210592384)))]; tensor linear_153_cast_fp16 = linear(bias = linear_2_bias_0_to_fp16, weight = encoder_layers_16_feed_forward2_linear2_weight_to_fp16, x = input_901_cast_fp16)[name = tensor("linear_153_cast_fp16")]; tensor var_3787_to_fp16 = const()[name = tensor("op_3787_to_fp16"), val = tensor(0x1p-1)]; tensor var_3788_cast_fp16 = mul(x = linear_153_cast_fp16, y = var_3787_to_fp16)[name = tensor("op_3788_cast_fp16")]; tensor input_cast_fp16 = add(x = input_895_cast_fp16, y = var_3788_cast_fp16)[name = tensor("input_cast_fp16")]; tensor audio_signal_axes_0 = const()[name = tensor("audio_signal_axes_0"), val = tensor([-1])]; tensor encoder_layers_16_norm_out_weight_to_fp16 = const()[name = tensor("encoder_layers_16_norm_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(212689600)))]; tensor encoder_layers_16_norm_out_bias_to_fp16 = const()[name = tensor("encoder_layers_16_norm_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(212690688)))]; tensor audio_signal_cast_fp16 = layer_norm(axes = audio_signal_axes_0, beta = encoder_layers_16_norm_out_bias_to_fp16, epsilon = var_38_to_fp16, gamma = encoder_layers_16_norm_out_weight_to_fp16, x = input_cast_fp16)[name = tensor("audio_signal_cast_fp16")]; tensor obj_1_perm_0 = const()[name = tensor("obj_1_perm_0"), val = tensor([0, 2, 1])]; tensor cast_178_dtype_0 = const()[name = tensor("cast_178_dtype_0"), val = tensor("int32")]; tensor obj_5_axis_0 = const()[name = tensor("obj_5_axis_0"), val = tensor(0)]; tensor obj_5_cast_fp16 = stack(axis = obj_5_axis_0, values = (var_332_cast_fp16, var_539_cast_fp16, var_746_cast_fp16, var_953_cast_fp16, var_1160_cast_fp16, var_1367_cast_fp16, var_1574_cast_fp16, var_1781_cast_fp16, var_1988_cast_fp16, var_2195_cast_fp16, var_2402_cast_fp16, var_2609_cast_fp16, var_2816_cast_fp16, var_3023_cast_fp16, var_3230_cast_fp16, var_3437_cast_fp16, cache_last_channel_cur_cast_fp16))[name = tensor("obj_5_cast_fp16")]; tensor obj_7_axis_0 = const()[name = tensor("obj_7_axis_0"), val = tensor(0)]; tensor obj_7_cast_fp16 = stack(axis = obj_7_axis_0, values = (var_434_cast_fp16, var_641_cast_fp16, var_848_cast_fp16, var_1055_cast_fp16, var_1262_cast_fp16, var_1469_cast_fp16, var_1676_cast_fp16, var_1883_cast_fp16, var_2090_cast_fp16, var_2297_cast_fp16, var_2504_cast_fp16, var_2711_cast_fp16, var_2918_cast_fp16, var_3125_cast_fp16, var_3332_cast_fp16, var_3539_cast_fp16, cache_last_time_cur_cast_fp16))[name = tensor("obj_7_cast_fp16")]; tensor obj_7_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("obj_7_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor var_3804 = add(x = cache_last_channel_len, y = cache_keep_size)[name = tensor("op_3804")]; tensor var_3804_promoted_to_fp16_dtype_0 = const()[name = tensor("op_3804_promoted_to_fp16_dtype_0"), val = tensor("fp16")]; tensor const_237_to_fp16 = const()[name = tensor("const_237_to_fp16"), val = tensor(-inf)]; tensor var_45_promoted_to_fp16 = const()[name = tensor("op_45_promoted_to_fp16"), val = tensor(0x1.18p+6)]; tensor var_3804_to_fp16 = cast(dtype = var_3804_promoted_to_fp16_dtype_0, x = var_3804)[name = tensor("cast_186")]; tensor clip_1_cast_fp16 = clip(alpha = const_237_to_fp16, beta = var_45_promoted_to_fp16, x = var_3804_to_fp16)[name = tensor("clip_1_cast_fp16")]; tensor var_3831_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("op_3831_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor var_3846_begin_0 = const()[name = tensor("op_3846_begin_0"), val = tensor([0, 0, 0])]; tensor var_3846_end_0 = const()[name = tensor("op_3846_end_0"), val = tensor([1, 512, 2])]; tensor var_3846_end_mask_0 = const()[name = tensor("op_3846_end_mask_0"), val = tensor([true, true, false])]; tensor obj_1_cast_fp16 = transpose(perm = obj_1_perm_0, x = audio_signal_cast_fp16)[name = tensor("transpose_85")]; tensor var_3846_cast_fp16 = slice_by_index(begin = var_3846_begin_0, end = var_3846_end_0, end_mask = var_3846_end_mask_0, x = obj_1_cast_fp16)[name = tensor("op_3846_cast_fp16")]; tensor var_3846_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("op_3846_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor cast_178_promoted_to_fp16_dtype_0 = const()[name = tensor("cast_178_promoted_to_fp16_dtype_0"), val = tensor("fp16")]; tensor const_238_to_fp16 = const()[name = tensor("const_238_to_fp16"), val = tensor(-inf)]; tensor var_3848_promoted_to_fp16 = const()[name = tensor("op_3848_promoted_to_fp16"), val = tensor(0x1p+1)]; tensor clip_0_cast_fp16_to_int32 = cast(dtype = cast_178_dtype_0, x = clip_0_cast_fp16)[name = tensor("cast_188")]; tensor clip_0_cast_fp16_to_int32_to_fp16 = cast(dtype = cast_178_promoted_to_fp16_dtype_0, x = clip_0_cast_fp16_to_int32)[name = tensor("cast_183")]; tensor clip_2_cast_fp16 = clip(alpha = const_238_to_fp16, beta = var_3848_promoted_to_fp16, x = clip_0_cast_fp16_to_int32_to_fp16)[name = tensor("clip_2_cast_fp16")]; tensor cast_179_dtype_0 = const()[name = tensor("cast_179_dtype_0"), val = tensor("int32")]; tensor cast_180_dtype_0 = const()[name = tensor("cast_180_dtype_0"), val = tensor("int32")]; tensor new_cache_last_channel_len = cast(dtype = cast_180_dtype_0, x = clip_1_cast_fp16)[name = tensor("cast_181")]; tensor encoded_length = cast(dtype = cast_179_dtype_0, x = clip_2_cast_fp16)[name = tensor("cast_182")]; tensor encoded_output = cast(dtype = var_3846_cast_fp16_to_fp32_dtype_0, x = var_3846_cast_fp16)[name = tensor("cast_184")]; tensor new_cache_last_channel = cast(dtype = var_3831_cast_fp16_to_fp32_dtype_0, x = obj_5_cast_fp16)[name = tensor("cast_185")]; tensor new_cache_last_time = cast(dtype = obj_7_cast_fp16_to_fp32_dtype_0, x = obj_7_cast_fp16)[name = tensor("cast_187")]; tensor new_pre_cache = cast(dtype = var_28_cast_fp16_to_fp32_dtype_0, x = var_28_cast_fp16)[name = tensor("cast_194")]; } -> (encoded_output, encoded_length, new_pre_cache, new_cache_last_channel, new_cache_last_time, new_cache_last_channel_len); }